{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {
    "toc": "true"
   },
   "source": [
    "# Table of Contents\n",
    " <p><div class=\"lev1 toc-item\"><a href=\"#将数据进行初步整理\" data-toc-modified-id=\"将数据进行初步整理-1\"><span class=\"toc-item-num\">1&nbsp;&nbsp;</span>将数据进行初步整理</a></div><div class=\"lev2 toc-item\"><a href=\"#Year-2007\" data-toc-modified-id=\"Year-2007-11\"><span class=\"toc-item-num\">1.1&nbsp;&nbsp;</span>Year 2007</a></div>"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": false
   },
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "\n",
    "% matplotlib inline"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "collapsed": true
   },
   "source": [
    "# 将数据进行初步整理"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Year 2007"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 2007年的数据，原始数据的单位为十亿美元"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 205,
   "metadata": {
    "collapsed": false,
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "the shape of DataFrame:  (2000, 9)\n",
      "年份                    int64\n",
      "排名(Rank)              int64\n",
      "公司名称(Company)        object\n",
      "所在国家或地区(Country)     object\n",
      "所在行业(Industry)       object\n",
      "销售收入(Sales)          object\n",
      "利润(Profits)          object\n",
      "总资产(Assets)          object\n",
      "市值(Market Vaue)     float64\n",
      "dtype: object\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>年份</th>\n",
       "      <th>排名(Rank)</th>\n",
       "      <th>公司名称(Company)</th>\n",
       "      <th>所在国家或地区(Country)</th>\n",
       "      <th>所在行业(Industry)</th>\n",
       "      <th>销售收入(Sales)</th>\n",
       "      <th>利润(Profits)</th>\n",
       "      <th>总资产(Assets)</th>\n",
       "      <th>市值(Market Vaue)</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2007</td>\n",
       "      <td>1</td>\n",
       "      <td>Citigroup /花旗集团</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>银行</td>\n",
       "      <td>146.56</td>\n",
       "      <td>21.54</td>\n",
       "      <td>1,884.32</td>\n",
       "      <td>247.42</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2007</td>\n",
       "      <td>2</td>\n",
       "      <td>Bank of America /美国银行</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>银行</td>\n",
       "      <td>116.57</td>\n",
       "      <td>21.13</td>\n",
       "      <td>1,459.74</td>\n",
       "      <td>226.61</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2007</td>\n",
       "      <td>3</td>\n",
       "      <td>HSBC Holdings/汇丰集团</td>\n",
       "      <td>英国(UK)</td>\n",
       "      <td>银行</td>\n",
       "      <td>121.51</td>\n",
       "      <td>16.63</td>\n",
       "      <td>1,860.76</td>\n",
       "      <td>202.29</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "     年份  排名(Rank)          公司名称(Company) 所在国家或地区(Country) 所在行业(Industry)  \\\n",
       "0  2007         1        Citigroup /花旗集团           美国(US)             银行   \n",
       "1  2007         2  Bank of America /美国银行           美国(US)             银行   \n",
       "2  2007         3     HSBC Holdings/汇丰集团           英国(UK)             银行   \n",
       "\n",
       "  销售收入(Sales) 利润(Profits) 总资产(Assets)  市值(Market Vaue)  \n",
       "0      146.56       21.54    1,884.32           247.42  \n",
       "1      116.57       21.13    1,459.74           226.61  \n",
       "2      121.51       16.63    1,860.76           202.29  "
      ]
     },
     "execution_count": 205,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_2007 = pd.read_csv('./data/data_forbes_2007.csv', encoding='gbk', thousands=',')\n",
    "print('the shape of DataFrame: ', df_2007.shape)\n",
    "print(df_2007.dtypes)\n",
    "df_2007.head(3)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 更新columns的命名"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 206,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2007</td>\n",
       "      <td>1</td>\n",
       "      <td>Citigroup /花旗集团</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>银行</td>\n",
       "      <td>146.56</td>\n",
       "      <td>21.54</td>\n",
       "      <td>1,884.32</td>\n",
       "      <td>247.42</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2007</td>\n",
       "      <td>2</td>\n",
       "      <td>Bank of America /美国银行</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>银行</td>\n",
       "      <td>116.57</td>\n",
       "      <td>21.13</td>\n",
       "      <td>1,459.74</td>\n",
       "      <td>226.61</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2007</td>\n",
       "      <td>3</td>\n",
       "      <td>HSBC Holdings/汇丰集团</td>\n",
       "      <td>英国(UK)</td>\n",
       "      <td>银行</td>\n",
       "      <td>121.51</td>\n",
       "      <td>16.63</td>\n",
       "      <td>1,860.76</td>\n",
       "      <td>202.29</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Year  Rank          Company_cn_en Country_cn_en Industry_cn   Sales  \\\n",
       "0  2007     1        Citigroup /花旗集团        美国(US)          银行  146.56   \n",
       "1  2007     2  Bank of America /美国银行        美国(US)          银行  116.57   \n",
       "2  2007     3     HSBC Holdings/汇丰集团        英国(UK)          银行  121.51   \n",
       "\n",
       "  Profits    Assets  Market_value  \n",
       "0   21.54  1,884.32        247.42  \n",
       "1   21.13  1,459.74        226.61  \n",
       "2   16.63  1,860.76        202.29  "
      ]
     },
     "execution_count": 206,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "column_update = ['Year', 'Rank', 'Company_cn_en', 'Country_cn_en', \n",
    "                 'Industry_cn', 'Sales', 'Profits', 'Assets', 'Market_value']\n",
    "df_2007.columns = column_update\n",
    "df_2007.head(3)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* **通过前面的分析可看出，只有“Market_value”是数字类型，找出'Sales','Profits'及'Assets'中非数字的内容**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 207,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>117</th>\n",
       "      <td>2007</td>\n",
       "      <td>118</td>\n",
       "      <td>Repsol-YPF /瑞普索</td>\n",
       "      <td>西班牙(SP)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>64.20 E</td>\n",
       "      <td>4.12</td>\n",
       "      <td>58.43</td>\n",
       "      <td>38.75</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>616</th>\n",
       "      <td>2007</td>\n",
       "      <td>617</td>\n",
       "      <td>Inpex Holdings</td>\n",
       "      <td>日本(JA)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>6.49 E</td>\n",
       "      <td>1.02 E</td>\n",
       "      <td>10.77 E</td>\n",
       "      <td>19.65</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>880</th>\n",
       "      <td>2007</td>\n",
       "      <td>881</td>\n",
       "      <td>Asahi Breweries/朝日啤酒</td>\n",
       "      <td>日本(JA)</td>\n",
       "      <td>食品、饮料和烟草</td>\n",
       "      <td>7.97 E</td>\n",
       "      <td>0.38</td>\n",
       "      <td>10.66</td>\n",
       "      <td>7.71</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "     Year  Rank         Company_cn_en Country_cn_en Industry_cn    Sales  \\\n",
       "117  2007   118       Repsol-YPF /瑞普索       西班牙(SP)          炼油  64.20 E   \n",
       "616  2007   617        Inpex Holdings        日本(JA)          炼油   6.49 E   \n",
       "880  2007   881  Asahi Breweries/朝日啤酒        日本(JA)    食品、饮料和烟草   7.97 E   \n",
       "\n",
       "    Profits   Assets  Market_value  \n",
       "117    4.12    58.43         38.75  \n",
       "616  1.02 E  10.77 E         19.65  \n",
       "880    0.38    10.66          7.71  "
      ]
     },
     "execution_count": 207,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_2007[df_2007['Sales'].str.contains('.*[A-Za-z]', regex=True)]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 用replace()方法替换“Sales”列中含有字母的内容"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 208,
   "metadata": {
    "collapsed": false,
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "df_2007['Sales'] = df_2007['Sales'].replace('([A-Za-z])', '', regex=True)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 查看替换后的结果"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 209,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>117</th>\n",
       "      <td>2007</td>\n",
       "      <td>118</td>\n",
       "      <td>Repsol-YPF /瑞普索</td>\n",
       "      <td>西班牙(SP)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>64.20</td>\n",
       "      <td>4.12</td>\n",
       "      <td>58.43</td>\n",
       "      <td>38.75</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>616</th>\n",
       "      <td>2007</td>\n",
       "      <td>617</td>\n",
       "      <td>Inpex Holdings</td>\n",
       "      <td>日本(JA)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>6.49</td>\n",
       "      <td>1.02 E</td>\n",
       "      <td>10.77 E</td>\n",
       "      <td>19.65</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>880</th>\n",
       "      <td>2007</td>\n",
       "      <td>881</td>\n",
       "      <td>Asahi Breweries/朝日啤酒</td>\n",
       "      <td>日本(JA)</td>\n",
       "      <td>食品、饮料和烟草</td>\n",
       "      <td>7.97</td>\n",
       "      <td>0.38</td>\n",
       "      <td>10.66</td>\n",
       "      <td>7.71</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "     Year  Rank         Company_cn_en Country_cn_en Industry_cn   Sales  \\\n",
       "117  2007   118       Repsol-YPF /瑞普索       西班牙(SP)          炼油  64.20    \n",
       "616  2007   617        Inpex Holdings        日本(JA)          炼油   6.49    \n",
       "880  2007   881  Asahi Breweries/朝日啤酒        日本(JA)    食品、饮料和烟草   7.97    \n",
       "\n",
       "    Profits   Assets  Market_value  \n",
       "117    4.12    58.43         38.75  \n",
       "616  1.02 E  10.77 E         19.65  \n",
       "880    0.38    10.66          7.71  "
      ]
     },
     "execution_count": 209,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_2007.loc[[117,616,880], :]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* **查看“Assets”列中非数字的内容**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 210,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>616</th>\n",
       "      <td>2007</td>\n",
       "      <td>617</td>\n",
       "      <td>Inpex Holdings</td>\n",
       "      <td>日本(JA)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>6.49</td>\n",
       "      <td>1.02 E</td>\n",
       "      <td>10.77 E</td>\n",
       "      <td>19.65</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "     Year  Rank   Company_cn_en Country_cn_en Industry_cn  Sales Profits  \\\n",
       "616  2007   617  Inpex Holdings        日本(JA)          炼油  6.49   1.02 E   \n",
       "\n",
       "      Assets  Market_value  \n",
       "616  10.77 E         19.65  "
      ]
     },
     "execution_count": 210,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_2007[df_2007['Assets'].str.contains('.*[A-Za-z]', regex=True)]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 替换非数字的内容，以及替换千分位间隔符号"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 211,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Year                       2007\n",
       "Rank                        617\n",
       "Company_cn_en    Inpex Holdings\n",
       "Country_cn_en            日本(JA)\n",
       "Industry_cn                  炼油\n",
       "Sales                     6.49 \n",
       "Profits                  1.02 E\n",
       "Assets                   10.77 \n",
       "Market_value              19.65\n",
       "Name: 616, dtype: object"
      ]
     },
     "execution_count": 211,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 将数字后面的字母进行替换\n",
    "df_2007['Assets'] = df_2007['Assets'].replace('([A-Za-z])', '', regex=True)\n",
    "\n",
    "# 千分位数字的逗号被识别为string了，需要替换\n",
    "df_2007['Assets'] = df_2007['Assets'].replace(',', '', regex=True)\n",
    "df_2007.loc[616, :]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* **发现“Profits”中有NaN值，需要先进行替换**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 212,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>958</th>\n",
       "      <td>2007</td>\n",
       "      <td>959</td>\n",
       "      <td>UAL/美国联合航空公司</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>运输</td>\n",
       "      <td>19.34</td>\n",
       "      <td>NaN</td>\n",
       "      <td>25.86</td>\n",
       "      <td>4.43</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1440</th>\n",
       "      <td>2007</td>\n",
       "      <td>1441</td>\n",
       "      <td>Owens Corning/欧文斯科宁</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>建筑</td>\n",
       "      <td>6.46</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8.47</td>\n",
       "      <td>4.19</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1544</th>\n",
       "      <td>2007</td>\n",
       "      <td>1545</td>\n",
       "      <td>Parmalat/帕玛拉特公司</td>\n",
       "      <td>意大利(IT)</td>\n",
       "      <td>食品、饮料和烟草</td>\n",
       "      <td>4.83</td>\n",
       "      <td>NaN</td>\n",
       "      <td>4.90</td>\n",
       "      <td>7.02</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1912</th>\n",
       "      <td>2007</td>\n",
       "      <td>1912</td>\n",
       "      <td>Winn-Dixie Stores</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>食品市场</td>\n",
       "      <td>6.96</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.62</td>\n",
       "      <td>1.05</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      Year  Rank        Company_cn_en Country_cn_en Industry_cn  Sales  \\\n",
       "958   2007   959         UAL/美国联合航空公司        美国(US)          运输  19.34   \n",
       "1440  2007  1441  Owens Corning/欧文斯科宁        美国(US)          建筑   6.46   \n",
       "1544  2007  1545      Parmalat/帕玛拉特公司       意大利(IT)    食品、饮料和烟草   4.83   \n",
       "1912  2007  1912    Winn-Dixie Stores        美国(US)        食品市场   6.96   \n",
       "\n",
       "     Profits Assets  Market_value  \n",
       "958      NaN  25.86          4.43  \n",
       "1440     NaN   8.47          4.19  \n",
       "1544     NaN   4.90          7.02  \n",
       "1912     NaN   1.62          1.05  "
      ]
     },
     "execution_count": 212,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_2007[pd.isnull(df_2007['Profits'])]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 将NaN值填充为 0"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 213,
   "metadata": {
    "collapsed": false,
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>958</th>\n",
       "      <td>2007</td>\n",
       "      <td>959</td>\n",
       "      <td>UAL/美国联合航空公司</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>运输</td>\n",
       "      <td>19.34</td>\n",
       "      <td>0</td>\n",
       "      <td>25.86</td>\n",
       "      <td>4.43</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1440</th>\n",
       "      <td>2007</td>\n",
       "      <td>1441</td>\n",
       "      <td>Owens Corning/欧文斯科宁</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>建筑</td>\n",
       "      <td>6.46</td>\n",
       "      <td>0</td>\n",
       "      <td>8.47</td>\n",
       "      <td>4.19</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1544</th>\n",
       "      <td>2007</td>\n",
       "      <td>1545</td>\n",
       "      <td>Parmalat/帕玛拉特公司</td>\n",
       "      <td>意大利(IT)</td>\n",
       "      <td>食品、饮料和烟草</td>\n",
       "      <td>4.83</td>\n",
       "      <td>0</td>\n",
       "      <td>4.90</td>\n",
       "      <td>7.02</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1912</th>\n",
       "      <td>2007</td>\n",
       "      <td>1912</td>\n",
       "      <td>Winn-Dixie Stores</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>食品市场</td>\n",
       "      <td>6.96</td>\n",
       "      <td>0</td>\n",
       "      <td>1.62</td>\n",
       "      <td>1.05</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      Year  Rank        Company_cn_en Country_cn_en Industry_cn  Sales  \\\n",
       "958   2007   959         UAL/美国联合航空公司        美国(US)          运输  19.34   \n",
       "1440  2007  1441  Owens Corning/欧文斯科宁        美国(US)          建筑   6.46   \n",
       "1544  2007  1545      Parmalat/帕玛拉特公司       意大利(IT)    食品、饮料和烟草   4.83   \n",
       "1912  2007  1912    Winn-Dixie Stores        美国(US)        食品市场   6.96   \n",
       "\n",
       "     Profits Assets  Market_value  \n",
       "958        0  25.86          4.43  \n",
       "1440       0   8.47          4.19  \n",
       "1544       0   4.90          7.02  \n",
       "1912       0   1.62          1.05  "
      ]
     },
     "execution_count": 213,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_2007['Profits'].fillna(0, inplace=True)\n",
    "df_2007.loc[[958,1440,1544,1912], :]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 将“Profits”列中非数字的内容进行替换，并查看替换后的结果"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 214,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>117</th>\n",
       "      <td>2007</td>\n",
       "      <td>118</td>\n",
       "      <td>Repsol-YPF /瑞普索</td>\n",
       "      <td>西班牙(SP)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>64.20</td>\n",
       "      <td>4.12</td>\n",
       "      <td>58.43</td>\n",
       "      <td>38.75</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>616</th>\n",
       "      <td>2007</td>\n",
       "      <td>617</td>\n",
       "      <td>Inpex Holdings</td>\n",
       "      <td>日本(JA)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>6.49</td>\n",
       "      <td>1.02</td>\n",
       "      <td>10.77</td>\n",
       "      <td>19.65</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>880</th>\n",
       "      <td>2007</td>\n",
       "      <td>881</td>\n",
       "      <td>Asahi Breweries/朝日啤酒</td>\n",
       "      <td>日本(JA)</td>\n",
       "      <td>食品、饮料和烟草</td>\n",
       "      <td>7.97</td>\n",
       "      <td>0.38</td>\n",
       "      <td>10.66</td>\n",
       "      <td>7.71</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "     Year  Rank         Company_cn_en Country_cn_en Industry_cn   Sales  \\\n",
       "117  2007   118       Repsol-YPF /瑞普索       西班牙(SP)          炼油  64.20    \n",
       "616  2007   617        Inpex Holdings        日本(JA)          炼油   6.49    \n",
       "880  2007   881  Asahi Breweries/朝日啤酒        日本(JA)    食品、饮料和烟草   7.97    \n",
       "\n",
       "    Profits  Assets  Market_value  \n",
       "117    4.12   58.43         38.75  \n",
       "616   1.02   10.77          19.65  \n",
       "880    0.38   10.66          7.71  "
      ]
     },
     "execution_count": 214,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_2007['Profits'] = df_2007['Profits'].replace('([A-Za-z])', '', regex=True)\n",
    "df_2007.loc[[117,616,880], :]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* **将sting类型的数字转换为数据类型，这里使用 pd.to_numeric() 方法**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 215,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Year               int64\n",
       "Rank               int64\n",
       "Company_cn_en     object\n",
       "Country_cn_en     object\n",
       "Industry_cn       object\n",
       "Sales            float64\n",
       "Profits          float64\n",
       "Assets           float64\n",
       "Market_value     float64\n",
       "dtype: object"
      ]
     },
     "execution_count": 215,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_2007['Sales'] = pd.to_numeric(df_2007['Sales'])\n",
    "df_2007['Profits'] = pd.to_numeric(df_2007['Profits'])\n",
    "df_2007['Assets'] = pd.to_numeric(df_2007['Assets'])\n",
    "df_2007.dtypes"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {
    "collapsed": true
   },
   "source": [
    "* **拆分\"Company_cn_en\"列**，新生成两列，分别为公司英文名称和中文名称"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 216,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0           Citigroup \n",
      "1     Bank of America \n",
      "2        HSBC Holdings\n",
      "3    General Electric \n",
      "4      JPMorgan Chase \n",
      "Name: Company_en, dtype: object\n",
      "1995    NaN\n",
      "1996    NaN\n",
      "1997    NaN\n",
      "1998    NaN\n",
      "1999    NaN\n",
      "Name: Company_cn, dtype: object\n"
     ]
    }
   ],
   "source": [
    "df_2007['Company_en'],df_2007['Company_cn'] = df_2007['Company_cn_en'].str.split('/', 1).str\n",
    "print(df_2007['Company_en'][:5])\n",
    "print(df_2007['Company_cn'] [-5:])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 217,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "      <th>Company_en</th>\n",
       "      <th>Company_cn</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1997</th>\n",
       "      <td>2007</td>\n",
       "      <td>1998</td>\n",
       "      <td>CBOT Holdings</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.64</td>\n",
       "      <td>0.17</td>\n",
       "      <td>0.81</td>\n",
       "      <td>8.54</td>\n",
       "      <td>CBOT Holdings</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1998</th>\n",
       "      <td>2007</td>\n",
       "      <td>1998</td>\n",
       "      <td>Singapore Petroleum</td>\n",
       "      <td>新加坡(SI)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>5.59</td>\n",
       "      <td>0.19</td>\n",
       "      <td>2.05</td>\n",
       "      <td>1.50</td>\n",
       "      <td>Singapore Petroleum</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1999</th>\n",
       "      <td>2007</td>\n",
       "      <td>2000</td>\n",
       "      <td>DVB Bank</td>\n",
       "      <td>德国(GE)</td>\n",
       "      <td>银行</td>\n",
       "      <td>0.77</td>\n",
       "      <td>0.06</td>\n",
       "      <td>12.74</td>\n",
       "      <td>1.26</td>\n",
       "      <td>DVB Bank</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      Year  Rank        Company_cn_en Country_cn_en Industry_cn  Sales  \\\n",
       "1997  2007  1998        CBOT Holdings        美国(US)        综合金融   0.64   \n",
       "1998  2007  1998  Singapore Petroleum       新加坡(SI)          炼油   5.59   \n",
       "1999  2007  2000             DVB Bank        德国(GE)          银行   0.77   \n",
       "\n",
       "      Profits  Assets  Market_value           Company_en Company_cn  \n",
       "1997     0.17    0.81          8.54        CBOT Holdings        NaN  \n",
       "1998     0.19    2.05          1.50  Singapore Petroleum        NaN  \n",
       "1999     0.06   12.74          1.26             DVB Bank        NaN  "
      ]
     },
     "execution_count": 217,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_2007.tail(3)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* **拆分\"Country_cn_en\"列**，新生成两列，分别为国家中文名称和英文名称"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 218,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0    美国\n",
      "1    美国\n",
      "2    英国\n",
      "3    美国\n",
      "4    美国\n",
      "Name: Country_cn, dtype: object\n",
      "1995    US)\n",
      "1996    US)\n",
      "1997    US)\n",
      "1998    SI)\n",
      "1999    GE)\n",
      "Name: Country_en, dtype: object\n"
     ]
    }
   ],
   "source": [
    "# Split e.g. '美国(US)' at the first '(' into the Chinese name and the raw code 'US)'.\n",
    "# expand=True returns one column per piece. The previous idiom (tuple-unpacking the\n",
    "# `.str` accessor and passing `n` positionally) raises TypeError on pandas 2.x.\n",
    "# Multi-region values such as '中国香港(HK)/中国大陆(CN)' keep everything after the first '('.\n",
    "country_parts = df_2007['Country_cn_en'].str.split('(', n=1, expand=True)\n",
    "df_2007['Country_cn'] = country_parts[0]\n",
    "df_2007['Country_en'] = country_parts[1]\n",
    "print(df_2007['Country_cn'][:5])\n",
    "print(df_2007['Country_en'][-5:])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 由于国家的英文名称中，最后有半个括号，需要去除，用 Series.str.slice()方法\n",
    "* 参数表示选取从开始到倒数第二个，即不要括号\")\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 219,
   "metadata": {
    "collapsed": false,
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "      <th>Company_en</th>\n",
       "      <th>Company_cn</th>\n",
       "      <th>Country_cn</th>\n",
       "      <th>Country_en</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2007</td>\n",
       "      <td>1</td>\n",
       "      <td>Citigroup /花旗集团</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>银行</td>\n",
       "      <td>146.56</td>\n",
       "      <td>21.54</td>\n",
       "      <td>1884.32</td>\n",
       "      <td>247.42</td>\n",
       "      <td>Citigroup</td>\n",
       "      <td>花旗集团</td>\n",
       "      <td>美国</td>\n",
       "      <td>US</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2007</td>\n",
       "      <td>2</td>\n",
       "      <td>Bank of America /美国银行</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>银行</td>\n",
       "      <td>116.57</td>\n",
       "      <td>21.13</td>\n",
       "      <td>1459.74</td>\n",
       "      <td>226.61</td>\n",
       "      <td>Bank of America</td>\n",
       "      <td>美国银行</td>\n",
       "      <td>美国</td>\n",
       "      <td>US</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2007</td>\n",
       "      <td>3</td>\n",
       "      <td>HSBC Holdings/汇丰集团</td>\n",
       "      <td>英国(UK)</td>\n",
       "      <td>银行</td>\n",
       "      <td>121.51</td>\n",
       "      <td>16.63</td>\n",
       "      <td>1860.76</td>\n",
       "      <td>202.29</td>\n",
       "      <td>HSBC Holdings</td>\n",
       "      <td>汇丰集团</td>\n",
       "      <td>英国</td>\n",
       "      <td>UK</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Year  Rank          Company_cn_en Country_cn_en Industry_cn   Sales  \\\n",
       "0  2007     1        Citigroup /花旗集团        美国(US)          银行  146.56   \n",
       "1  2007     2  Bank of America /美国银行        美国(US)          银行  116.57   \n",
       "2  2007     3     HSBC Holdings/汇丰集团        英国(UK)          银行  121.51   \n",
       "\n",
       "   Profits   Assets  Market_value        Company_en Company_cn Country_cn  \\\n",
       "0    21.54  1884.32        247.42        Citigroup        花旗集团         美国   \n",
       "1    21.13  1459.74        226.61  Bank of America        美国银行         美国   \n",
       "2    16.63  1860.76        202.29     HSBC Holdings       汇丰集团         英国   \n",
       "\n",
       "  Country_en  \n",
       "0         US  \n",
       "1         US  \n",
       "2         UK  "
      ]
     },
     "execution_count": 219,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Drop the trailing ')' left over from the split, e.g. 'US)' -> 'US'.\n",
    "# Only values that still end with ')' are sliced, so re-running this cell cannot\n",
    "# eat a real character ('US' -> 'U'); missing values are left untouched.\n",
    "country_en = df_2007['Country_en']\n",
    "has_paren = country_en.str.endswith(')', na=False)\n",
    "df_2007['Country_en'] = country_en.where(~has_paren, country_en.str.slice(0, -1))\n",
    "df_2007.head(3)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 考虑到中国的企业分为中国大陆、中国香港、中国台湾\n",
    "* 对应的国家英文名称也需要修改下\n",
    "* 中国大陆：CN；中国香港：CN-HK；中国台湾：CN-TA"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 220,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "      <th>Company_en</th>\n",
       "      <th>Company_cn</th>\n",
       "      <th>Country_cn</th>\n",
       "      <th>Country_en</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>2007</td>\n",
       "      <td>41</td>\n",
       "      <td>PetroChina /中国石油</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>68.43</td>\n",
       "      <td>16.53</td>\n",
       "      <td>96.42</td>\n",
       "      <td>208.76</td>\n",
       "      <td>PetroChina</td>\n",
       "      <td>中国石油</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>52</th>\n",
       "      <td>2007</td>\n",
       "      <td>53</td>\n",
       "      <td>ICBC /中国工商银行</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>31.98</td>\n",
       "      <td>4.65</td>\n",
       "      <td>800.04</td>\n",
       "      <td>176.03</td>\n",
       "      <td>ICBC</td>\n",
       "      <td>中国工商银行</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>68</th>\n",
       "      <td>2007</td>\n",
       "      <td>69</td>\n",
       "      <td>CCB-China Construction Bank /中国建设银行</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>23.18</td>\n",
       "      <td>5.84</td>\n",
       "      <td>568.21</td>\n",
       "      <td>126.55</td>\n",
       "      <td>CCB-China Construction Bank</td>\n",
       "      <td>中国建设银行</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70</th>\n",
       "      <td>2007</td>\n",
       "      <td>71</td>\n",
       "      <td>Sinopec-China Petroleum /中石化</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>99.03</td>\n",
       "      <td>5.07</td>\n",
       "      <td>65.83</td>\n",
       "      <td>93.57</td>\n",
       "      <td>Sinopec-China Petroleum</td>\n",
       "      <td>中石化</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>81</th>\n",
       "      <td>2007</td>\n",
       "      <td>82</td>\n",
       "      <td>Bank of China /中国银行</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>23.10</td>\n",
       "      <td>3.41</td>\n",
       "      <td>585.55</td>\n",
       "      <td>143.80</td>\n",
       "      <td>Bank of China</td>\n",
       "      <td>中国银行</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>88</th>\n",
       "      <td>2007</td>\n",
       "      <td>89</td>\n",
       "      <td>China Mobile /中国移动</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>29.79</td>\n",
       "      <td>6.56</td>\n",
       "      <td>51.35</td>\n",
       "      <td>185.31</td>\n",
       "      <td>China Mobile</td>\n",
       "      <td>中国移动</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>175</th>\n",
       "      <td>2007</td>\n",
       "      <td>176</td>\n",
       "      <td>Hutchison Whampoa/和记黄埔</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>多元化</td>\n",
       "      <td>23.55</td>\n",
       "      <td>1.85</td>\n",
       "      <td>74.97</td>\n",
       "      <td>40.57</td>\n",
       "      <td>Hutchison Whampoa</td>\n",
       "      <td>和记黄埔</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>180</th>\n",
       "      <td>2007</td>\n",
       "      <td>181</td>\n",
       "      <td>China Telecom/中国电信</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>20.98</td>\n",
       "      <td>3.46</td>\n",
       "      <td>50.34</td>\n",
       "      <td>37.50</td>\n",
       "      <td>China Telecom</td>\n",
       "      <td>中国电信</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>242</th>\n",
       "      <td>2007</td>\n",
       "      <td>243</td>\n",
       "      <td>China Life Insurance /中国人寿</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>保险</td>\n",
       "      <td>11.18</td>\n",
       "      <td>1.15</td>\n",
       "      <td>69.30</td>\n",
       "      <td>109.96</td>\n",
       "      <td>China Life Insurance</td>\n",
       "      <td>中国人寿</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>307</th>\n",
       "      <td>2007</td>\n",
       "      <td>308</td>\n",
       "      <td>Bank of Communications/中国交通银行</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>6.64</td>\n",
       "      <td>1.15</td>\n",
       "      <td>176.27</td>\n",
       "      <td>46.14</td>\n",
       "      <td>Bank of Communications</td>\n",
       "      <td>中国交通银行</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>309</th>\n",
       "      <td>2007</td>\n",
       "      <td>310</td>\n",
       "      <td>Taiwan Semiconductor/台积电</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>半导体</td>\n",
       "      <td>9.74</td>\n",
       "      <td>3.90</td>\n",
       "      <td>18.02</td>\n",
       "      <td>54.32</td>\n",
       "      <td>Taiwan Semiconductor</td>\n",
       "      <td>台积电</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>340</th>\n",
       "      <td>2007</td>\n",
       "      <td>341</td>\n",
       "      <td>Hon Hai Precision Ind /鸿海精密</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>技术硬件和装备</td>\n",
       "      <td>27.78</td>\n",
       "      <td>1.24</td>\n",
       "      <td>13.99</td>\n",
       "      <td>34.83</td>\n",
       "      <td>Hon Hai Precision Ind</td>\n",
       "      <td>鸿海精密</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>365</th>\n",
       "      <td>2007</td>\n",
       "      <td>366</td>\n",
       "      <td>Baoshan Iron &amp; Steel /上海宝钢集团</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>材料</td>\n",
       "      <td>15.63</td>\n",
       "      <td>1.57</td>\n",
       "      <td>17.59</td>\n",
       "      <td>21.42</td>\n",
       "      <td>Baoshan Iron &amp; Steel</td>\n",
       "      <td>上海宝钢集团</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>388</th>\n",
       "      <td>2007</td>\n",
       "      <td>389</td>\n",
       "      <td>Cathay Financial/国泰金融</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>保险</td>\n",
       "      <td>10.09</td>\n",
       "      <td>0.66</td>\n",
       "      <td>93.29</td>\n",
       "      <td>19.87</td>\n",
       "      <td>Cathay Financial</td>\n",
       "      <td>国泰金融</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>394</th>\n",
       "      <td>2007</td>\n",
       "      <td>395</td>\n",
       "      <td>Cnooc /中海油</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>8.51</td>\n",
       "      <td>3.10</td>\n",
       "      <td>14.22</td>\n",
       "      <td>34.94</td>\n",
       "      <td>Cnooc</td>\n",
       "      <td>中海油</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>400</th>\n",
       "      <td>2007</td>\n",
       "      <td>401</td>\n",
       "      <td>China Netcom Group /中国网通</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>10.69</td>\n",
       "      <td>1.70</td>\n",
       "      <td>24.70</td>\n",
       "      <td>15.70</td>\n",
       "      <td>China Netcom Group</td>\n",
       "      <td>中国网通</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>422</th>\n",
       "      <td>2007</td>\n",
       "      <td>423</td>\n",
       "      <td>China Shenhua Energy/中国神华能源股份有限公司</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>材料</td>\n",
       "      <td>6.47</td>\n",
       "      <td>1.94</td>\n",
       "      <td>17.08</td>\n",
       "      <td>45.94</td>\n",
       "      <td>China Shenhua Energy</td>\n",
       "      <td>中国神华能源股份有限公司</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>429</th>\n",
       "      <td>2007</td>\n",
       "      <td>430</td>\n",
       "      <td>BOC Hong Kong/中银香港</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>4.13</td>\n",
       "      <td>1.74</td>\n",
       "      <td>106.03</td>\n",
       "      <td>25.58</td>\n",
       "      <td>BOC Hong Kong</td>\n",
       "      <td>中银香港</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>436</th>\n",
       "      <td>2007</td>\n",
       "      <td>437</td>\n",
       "      <td>Formosa Petrochemical/台塑石化</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>13.56</td>\n",
       "      <td>1.74</td>\n",
       "      <td>12.35</td>\n",
       "      <td>19.28</td>\n",
       "      <td>Formosa Petrochemical</td>\n",
       "      <td>台塑石化</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>439</th>\n",
       "      <td>2007</td>\n",
       "      <td>440</td>\n",
       "      <td>Ping An Insurance Group/平安保险</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>保险</td>\n",
       "      <td>7.95</td>\n",
       "      <td>0.52</td>\n",
       "      <td>39.62</td>\n",
       "      <td>39.60</td>\n",
       "      <td>Ping An Insurance Group</td>\n",
       "      <td>平安保险</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>451</th>\n",
       "      <td>2007</td>\n",
       "      <td>452</td>\n",
       "      <td>Jardine Matheson/香港怡和集团</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>食品市场</td>\n",
       "      <td>11.96</td>\n",
       "      <td>1.25</td>\n",
       "      <td>18.34</td>\n",
       "      <td>13.59</td>\n",
       "      <td>Jardine Matheson</td>\n",
       "      <td>香港怡和集团</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>510</th>\n",
       "      <td>2007</td>\n",
       "      <td>511</td>\n",
       "      <td>Sun Hung Kai Properties /新鸿基房地产</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>3.30</td>\n",
       "      <td>2.56</td>\n",
       "      <td>29.72</td>\n",
       "      <td>29.49</td>\n",
       "      <td>Sun Hung Kai Properties</td>\n",
       "      <td>新鸿基房地产</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>541</th>\n",
       "      <td>2007</td>\n",
       "      <td>542</td>\n",
       "      <td>China Unicom /中国联通</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>10.67</td>\n",
       "      <td>0.60</td>\n",
       "      <td>17.63</td>\n",
       "      <td>16.03</td>\n",
       "      <td>China Unicom</td>\n",
       "      <td>中国联通</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>551</th>\n",
       "      <td>2007</td>\n",
       "      <td>552</td>\n",
       "      <td>CLP Holdings /中电控股</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>公用事业</td>\n",
       "      <td>5.87</td>\n",
       "      <td>1.27</td>\n",
       "      <td>16.42</td>\n",
       "      <td>17.65</td>\n",
       "      <td>CLP Holdings</td>\n",
       "      <td>中电控股</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>575</th>\n",
       "      <td>2007</td>\n",
       "      <td>576</td>\n",
       "      <td>Chunghwa Telecom/中华电信</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>5.59</td>\n",
       "      <td>1.45</td>\n",
       "      <td>13.98</td>\n",
       "      <td>18.22</td>\n",
       "      <td>Chunghwa Telecom</td>\n",
       "      <td>中华电信</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>600</th>\n",
       "      <td>2007</td>\n",
       "      <td>601</td>\n",
       "      <td>China Steel/台湾中钢公司</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>材料</td>\n",
       "      <td>8.66</td>\n",
       "      <td>1.54</td>\n",
       "      <td>10.35</td>\n",
       "      <td>12.24</td>\n",
       "      <td>China Steel</td>\n",
       "      <td>台湾中钢公司</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>603</th>\n",
       "      <td>2007</td>\n",
       "      <td>604</td>\n",
       "      <td>China Merchants Bank/招商银行</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>3.53</td>\n",
       "      <td>0.46</td>\n",
       "      <td>90.76</td>\n",
       "      <td>33.19</td>\n",
       "      <td>China Merchants Bank</td>\n",
       "      <td>招商银行</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>617</th>\n",
       "      <td>2007</td>\n",
       "      <td>617</td>\n",
       "      <td>Nan Ya Plastic/南亚塑胶工业</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>化学制品</td>\n",
       "      <td>7.64</td>\n",
       "      <td>1.22</td>\n",
       "      <td>11.47</td>\n",
       "      <td>13.37</td>\n",
       "      <td>Nan Ya Plastic</td>\n",
       "      <td>南亚塑胶工业</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>627</th>\n",
       "      <td>2007</td>\n",
       "      <td>628</td>\n",
       "      <td>Cheung Kong/长江集团</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.80</td>\n",
       "      <td>1.80</td>\n",
       "      <td>28.01</td>\n",
       "      <td>28.39</td>\n",
       "      <td>Cheung Kong</td>\n",
       "      <td>长江集团</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>736</th>\n",
       "      <td>2007</td>\n",
       "      <td>737</td>\n",
       "      <td>Swire Pacific /太古集团</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>多元化</td>\n",
       "      <td>2.44</td>\n",
       "      <td>2.42</td>\n",
       "      <td>16.05</td>\n",
       "      <td>17.32</td>\n",
       "      <td>Swire Pacific</td>\n",
       "      <td>太古集团</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1636</th>\n",
       "      <td>2007</td>\n",
       "      <td>1637</td>\n",
       "      <td>Champion REIT</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.05</td>\n",
       "      <td>1.16</td>\n",
       "      <td>2.95</td>\n",
       "      <td>1.54</td>\n",
       "      <td>Champion REIT</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1641</th>\n",
       "      <td>2007</td>\n",
       "      <td>1642</td>\n",
       "      <td>Noble Group</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>运输</td>\n",
       "      <td>13.75</td>\n",
       "      <td>0.13</td>\n",
       "      <td>3.81</td>\n",
       "      <td>2.14</td>\n",
       "      <td>Noble Group</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1661</th>\n",
       "      <td>2007</td>\n",
       "      <td>1662</td>\n",
       "      <td>Taiwan Mobile</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>1.81</td>\n",
       "      <td>0.50</td>\n",
       "      <td>3.59</td>\n",
       "      <td>4.84</td>\n",
       "      <td>Taiwan Mobile</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1681</th>\n",
       "      <td>2007</td>\n",
       "      <td>1682</td>\n",
       "      <td>Evergreen Marine</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>运输</td>\n",
       "      <td>4.29</td>\n",
       "      <td>0.37</td>\n",
       "      <td>3.96</td>\n",
       "      <td>1.90</td>\n",
       "      <td>Evergreen Marine</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1692</th>\n",
       "      <td>2007</td>\n",
       "      <td>1693</td>\n",
       "      <td>China Southern Airlines</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>运输</td>\n",
       "      <td>4.64</td>\n",
       "      <td>-0.23</td>\n",
       "      <td>8.84</td>\n",
       "      <td>1.97</td>\n",
       "      <td>China Southern Airlines</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1705</th>\n",
       "      <td>2007</td>\n",
       "      <td>1706</td>\n",
       "      <td>Cosco Pacific</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>运输</td>\n",
       "      <td>0.30</td>\n",
       "      <td>0.34</td>\n",
       "      <td>2.85</td>\n",
       "      <td>5.94</td>\n",
       "      <td>Cosco Pacific</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1710</th>\n",
       "      <td>2007</td>\n",
       "      <td>1711</td>\n",
       "      <td>China Shipping Container</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>运输</td>\n",
       "      <td>3.52</td>\n",
       "      <td>0.44</td>\n",
       "      <td>3.59</td>\n",
       "      <td>2.26</td>\n",
       "      <td>China Shipping Container</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1736</th>\n",
       "      <td>2007</td>\n",
       "      <td>1737</td>\n",
       "      <td>China Resources Power Holdings</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>公用事业</td>\n",
       "      <td>0.76</td>\n",
       "      <td>0.37</td>\n",
       "      <td>3.67</td>\n",
       "      <td>5.37</td>\n",
       "      <td>China Resources Power Holdings</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1739</th>\n",
       "      <td>2007</td>\n",
       "      <td>1740</td>\n",
       "      <td>Citic Securities</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.14</td>\n",
       "      <td>0.04</td>\n",
       "      <td>2.52</td>\n",
       "      <td>14.29</td>\n",
       "      <td>Citic Securities</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1780</th>\n",
       "      <td>2007</td>\n",
       "      <td>1781</td>\n",
       "      <td>Far EasTone Telecom</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>2.19</td>\n",
       "      <td>0.45</td>\n",
       "      <td>3.01</td>\n",
       "      <td>4.45</td>\n",
       "      <td>Far EasTone Telecom</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1786</th>\n",
       "      <td>2007</td>\n",
       "      <td>1787</td>\n",
       "      <td>E.Sun Financial</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>银行</td>\n",
       "      <td>0.73</td>\n",
       "      <td>0.14</td>\n",
       "      <td>19.36</td>\n",
       "      <td>2.19</td>\n",
       "      <td>E.Sun Financial</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1824</th>\n",
       "      <td>2007</td>\n",
       "      <td>1825</td>\n",
       "      <td>Minmetals Development</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>贸易公司</td>\n",
       "      <td>8.25</td>\n",
       "      <td>0.04</td>\n",
       "      <td>3.46</td>\n",
       "      <td>1.50</td>\n",
       "      <td>Minmetals Development</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1840</th>\n",
       "      <td>2007</td>\n",
       "      <td>1841</td>\n",
       "      <td>Shanghai Automotive</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>耐用消费品</td>\n",
       "      <td>0.79</td>\n",
       "      <td>0.14</td>\n",
       "      <td>1.81</td>\n",
       "      <td>11.10</td>\n",
       "      <td>Shanghai Automotive</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1846</th>\n",
       "      <td>2007</td>\n",
       "      <td>1847</td>\n",
       "      <td>HK Exchanges &amp; Clearing</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.35</td>\n",
       "      <td>0.17</td>\n",
       "      <td>2.96</td>\n",
       "      <td>10.97</td>\n",
       "      <td>HK Exchanges &amp; Clearing</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1852</th>\n",
       "      <td>2007</td>\n",
       "      <td>1853</td>\n",
       "      <td>Link REIT</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.43</td>\n",
       "      <td>0.27</td>\n",
       "      <td>5.24</td>\n",
       "      <td>5.00</td>\n",
       "      <td>Link REIT</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1860</th>\n",
       "      <td>2007</td>\n",
       "      <td>1861</td>\n",
       "      <td>Kweichow Moutai</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>食品、饮料和烟草</td>\n",
       "      <td>0.43</td>\n",
       "      <td>0.14</td>\n",
       "      <td>1.00</td>\n",
       "      <td>10.69</td>\n",
       "      <td>Kweichow Moutai</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1892</th>\n",
       "      <td>2007</td>\n",
       "      <td>1892</td>\n",
       "      <td>Yanzhou Coal Mining</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>材料</td>\n",
       "      <td>1.43</td>\n",
       "      <td>0.36</td>\n",
       "      <td>2.63</td>\n",
       "      <td>4.52</td>\n",
       "      <td>Yanzhou Coal Mining</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1908</th>\n",
       "      <td>2007</td>\n",
       "      <td>1909</td>\n",
       "      <td>China Shipping Develop</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>运输</td>\n",
       "      <td>1.06</td>\n",
       "      <td>0.33</td>\n",
       "      <td>1.66</td>\n",
       "      <td>4.61</td>\n",
       "      <td>China Shipping Develop</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1920</th>\n",
       "      <td>2007</td>\n",
       "      <td>1920</td>\n",
       "      <td>Wing Lung Bank</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>0.66</td>\n",
       "      <td>0.21</td>\n",
       "      <td>10.92</td>\n",
       "      <td>2.43</td>\n",
       "      <td>Wing Lung Bank</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1922</th>\n",
       "      <td>2007</td>\n",
       "      <td>1923</td>\n",
       "      <td>Delta Electronics</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>技术硬件和装备</td>\n",
       "      <td>2.46</td>\n",
       "      <td>0.23</td>\n",
       "      <td>2.49</td>\n",
       "      <td>6.40</td>\n",
       "      <td>Delta Electronics</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1945</th>\n",
       "      <td>2007</td>\n",
       "      <td>1946</td>\n",
       "      <td>China Airlines</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>运输</td>\n",
       "      <td>3.61</td>\n",
       "      <td>0.02</td>\n",
       "      <td>7.63</td>\n",
       "      <td>1.85</td>\n",
       "      <td>China Airlines</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1948</th>\n",
       "      <td>2007</td>\n",
       "      <td>1949</td>\n",
       "      <td>Wing Hang Bank</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>0.66</td>\n",
       "      <td>0.17</td>\n",
       "      <td>13.45</td>\n",
       "      <td>3.33</td>\n",
       "      <td>Wing Hang Bank</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1959</th>\n",
       "      <td>2007</td>\n",
       "      <td>1959</td>\n",
       "      <td>PCCW</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>2.90</td>\n",
       "      <td>0.21</td>\n",
       "      <td>6.87</td>\n",
       "      <td>3.98</td>\n",
       "      <td>PCCW</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1960</th>\n",
       "      <td>2007</td>\n",
       "      <td>1961</td>\n",
       "      <td>Benq</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>技术硬件和装备</td>\n",
       "      <td>5.39</td>\n",
       "      <td>-0.16</td>\n",
       "      <td>5.04</td>\n",
       "      <td>1.27</td>\n",
       "      <td>Benq</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1963</th>\n",
       "      <td>2007</td>\n",
       "      <td>1964</td>\n",
       "      <td>TCL Corp</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>技术硬件和装备</td>\n",
       "      <td>6.40</td>\n",
       "      <td>-0.04</td>\n",
       "      <td>3.77</td>\n",
       "      <td>1.39</td>\n",
       "      <td>TCL Corp</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1970</th>\n",
       "      <td>2007</td>\n",
       "      <td>1971</td>\n",
       "      <td>Wuliangye Yibin</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>食品、饮料和烟草</td>\n",
       "      <td>0.70</td>\n",
       "      <td>0.10</td>\n",
       "      <td>1.19</td>\n",
       "      <td>8.81</td>\n",
       "      <td>Wuliangye Yibin</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1973</th>\n",
       "      <td>2007</td>\n",
       "      <td>1974</td>\n",
       "      <td>CNPC (Hong Kong)</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>0.44</td>\n",
       "      <td>0.47</td>\n",
       "      <td>2.07</td>\n",
       "      <td>2.30</td>\n",
       "      <td>CNPC (Hong Kong)</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1975</th>\n",
       "      <td>2007</td>\n",
       "      <td>1976</td>\n",
       "      <td>K Wah International</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.04</td>\n",
       "      <td>0.47</td>\n",
       "      <td>1.29</td>\n",
       "      <td>0.98</td>\n",
       "      <td>K Wah International</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1986</th>\n",
       "      <td>2007</td>\n",
       "      <td>1987</td>\n",
       "      <td>China Overseas Land &amp; Inv</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.90</td>\n",
       "      <td>0.20</td>\n",
       "      <td>3.24</td>\n",
       "      <td>7.05</td>\n",
       "      <td>China Overseas Land &amp; Inv</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1989</th>\n",
       "      <td>2007</td>\n",
       "      <td>1989</td>\n",
       "      <td>Nine Dragons Paper Holdings</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>材料</td>\n",
       "      <td>0.99</td>\n",
       "      <td>0.17</td>\n",
       "      <td>1.86</td>\n",
       "      <td>8.61</td>\n",
       "      <td>Nine Dragons Paper Holdings</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>HK)/中国大陆(CN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>131 rows × 13 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      Year  Rank                        Company_cn_en      Country_cn_en  \\\n",
       "40    2007    41                     PetroChina /中国石油           中国大陆(CN)   \n",
       "52    2007    53                         ICBC /中国工商银行           中国大陆(CN)   \n",
       "68    2007    69  CCB-China Construction Bank /中国建设银行           中国大陆(CN)   \n",
       "70    2007    71         Sinopec-China Petroleum /中石化           中国大陆(CN)   \n",
       "81    2007    82                  Bank of China /中国银行           中国大陆(CN)   \n",
       "88    2007    89                   China Mobile /中国移动  中国香港(HK)/中国大陆(CN)   \n",
       "175   2007   176               Hutchison Whampoa/和记黄埔  中国香港(HK)/中国大陆(CN)   \n",
       "180   2007   181                   China Telecom/中国电信           中国大陆(CN)   \n",
       "242   2007   243           China Life Insurance /中国人寿           中国大陆(CN)   \n",
       "307   2007   308        Bank of Communications/中国交通银行           中国大陆(CN)   \n",
       "309   2007   310             Taiwan Semiconductor/台积电           中国台湾(TA)   \n",
       "340   2007   341          Hon Hai Precision Ind /鸿海精密           中国台湾(TA)   \n",
       "365   2007   366         Baoshan Iron & Steel /上海宝钢集团           中国大陆(CN)   \n",
       "388   2007   389                Cathay Financial/国泰金融           中国台湾(TA)   \n",
       "394   2007   395                           Cnooc /中海油  中国香港(HK)/中国大陆(CN)   \n",
       "400   2007   401             China Netcom Group /中国网通  中国香港(HK)/中国大陆(CN)   \n",
       "422   2007   423    China Shenhua Energy/中国神华能源股份有限公司           中国大陆(CN)   \n",
       "429   2007   430                   BOC Hong Kong/中银香港  中国香港(HK)/中国大陆(CN)   \n",
       "436   2007   437           Formosa Petrochemical/台塑石化           中国台湾(TA)   \n",
       "439   2007   440         Ping An Insurance Group/平安保险           中国大陆(CN)   \n",
       "451   2007   452              Jardine Matheson/香港怡和集团  中国香港(HK)/中国大陆(CN)   \n",
       "510   2007   511      Sun Hung Kai Properties /新鸿基房地产  中国香港(HK)/中国大陆(CN)   \n",
       "541   2007   542                   China Unicom /中国联通  中国香港(HK)/中国大陆(CN)   \n",
       "551   2007   552                   CLP Holdings /中电控股  中国香港(HK)/中国大陆(CN)   \n",
       "575   2007   576                Chunghwa Telecom/中华电信           中国台湾(TA)   \n",
       "600   2007   601                   China Steel/台湾中钢公司           中国台湾(TA)   \n",
       "603   2007   604            China Merchants Bank/招商银行           中国大陆(CN)   \n",
       "617   2007   617                Nan Ya Plastic/南亚塑胶工业           中国台湾(TA)   \n",
       "627   2007   628                     Cheung Kong/长江集团  中国香港(HK)/中国大陆(CN)   \n",
       "736   2007   737                  Swire Pacific /太古集团  中国香港(HK)/中国大陆(CN)   \n",
       "...    ...   ...                                  ...                ...   \n",
       "1636  2007  1637                        Champion REIT  中国香港(HK)/中国大陆(CN)   \n",
       "1641  2007  1642                          Noble Group  中国香港(HK)/中国大陆(CN)   \n",
       "1661  2007  1662                        Taiwan Mobile           中国台湾(TA)   \n",
       "1681  2007  1682                     Evergreen Marine           中国台湾(TA)   \n",
       "1692  2007  1693              China Southern Airlines           中国大陆(CN)   \n",
       "1705  2007  1706                        Cosco Pacific  中国香港(HK)/中国大陆(CN)   \n",
       "1710  2007  1711             China Shipping Container           中国大陆(CN)   \n",
       "1736  2007  1737       China Resources Power Holdings  中国香港(HK)/中国大陆(CN)   \n",
       "1739  2007  1740                     Citic Securities           中国大陆(CN)   \n",
       "1780  2007  1781                  Far EasTone Telecom           中国台湾(TA)   \n",
       "1786  2007  1787                      E.Sun Financial           中国台湾(TA)   \n",
       "1824  2007  1825                Minmetals Development           中国大陆(CN)   \n",
       "1840  2007  1841                  Shanghai Automotive           中国大陆(CN)   \n",
       "1846  2007  1847              HK Exchanges & Clearing  中国香港(HK)/中国大陆(CN)   \n",
       "1852  2007  1853                            Link REIT  中国香港(HK)/中国大陆(CN)   \n",
       "1860  2007  1861                      Kweichow Moutai           中国大陆(CN)   \n",
       "1892  2007  1892                  Yanzhou Coal Mining           中国大陆(CN)   \n",
       "1908  2007  1909               China Shipping Develop           中国大陆(CN)   \n",
       "1920  2007  1920                       Wing Lung Bank  中国香港(HK)/中国大陆(CN)   \n",
       "1922  2007  1923                    Delta Electronics           中国台湾(TA)   \n",
       "1945  2007  1946                       China Airlines           中国台湾(TA)   \n",
       "1948  2007  1949                       Wing Hang Bank  中国香港(HK)/中国大陆(CN)   \n",
       "1959  2007  1959                                 PCCW  中国香港(HK)/中国大陆(CN)   \n",
       "1960  2007  1961                                 Benq           中国台湾(TA)   \n",
       "1963  2007  1964                             TCL Corp           中国大陆(CN)   \n",
       "1970  2007  1971                      Wuliangye Yibin           中国大陆(CN)   \n",
       "1973  2007  1974                     CNPC (Hong Kong)  中国香港(HK)/中国大陆(CN)   \n",
       "1975  2007  1976                  K Wah International  中国香港(HK)/中国大陆(CN)   \n",
       "1986  2007  1987            China Overseas Land & Inv  中国香港(HK)/中国大陆(CN)   \n",
       "1989  2007  1989          Nine Dragons Paper Holdings  中国香港(HK)/中国大陆(CN)   \n",
       "\n",
       "     Industry_cn  Sales  Profits  Assets  Market_value  \\\n",
       "40            炼油  68.43    16.53   96.42        208.76   \n",
       "52            银行  31.98     4.65  800.04        176.03   \n",
       "68            银行  23.18     5.84  568.21        126.55   \n",
       "70            炼油  99.03     5.07   65.83         93.57   \n",
       "81            银行  23.10     3.41  585.55        143.80   \n",
       "88         电信运营商  29.79     6.56   51.35        185.31   \n",
       "175          多元化  23.55     1.85   74.97         40.57   \n",
       "180        电信运营商  20.98     3.46   50.34         37.50   \n",
       "242           保险  11.18     1.15   69.30        109.96   \n",
       "307           银行   6.64     1.15  176.27         46.14   \n",
       "309          半导体   9.74     3.90   18.02         54.32   \n",
       "340      技术硬件和装备  27.78     1.24   13.99         34.83   \n",
       "365           材料  15.63     1.57   17.59         21.42   \n",
       "388           保险  10.09     0.66   93.29         19.87   \n",
       "394           炼油   8.51     3.10   14.22         34.94   \n",
       "400        电信运营商  10.69     1.70   24.70         15.70   \n",
       "422           材料   6.47     1.94   17.08         45.94   \n",
       "429           银行   4.13     1.74  106.03         25.58   \n",
       "436           炼油  13.56     1.74   12.35         19.28   \n",
       "439           保险   7.95     0.52   39.62         39.60   \n",
       "451         食品市场  11.96     1.25   18.34         13.59   \n",
       "510         综合金融   3.30     2.56   29.72         29.49   \n",
       "541        电信运营商  10.67     0.60   17.63         16.03   \n",
       "551         公用事业   5.87     1.27   16.42         17.65   \n",
       "575        电信运营商   5.59     1.45   13.98         18.22   \n",
       "600           材料   8.66     1.54   10.35         12.24   \n",
       "603           银行   3.53     0.46   90.76         33.19   \n",
       "617         化学制品   7.64     1.22   11.47         13.37   \n",
       "627         综合金融   0.80     1.80   28.01         28.39   \n",
       "736          多元化   2.44     2.42   16.05         17.32   \n",
       "...          ...    ...      ...     ...           ...   \n",
       "1636        综合金融   0.05     1.16    2.95          1.54   \n",
       "1641          运输  13.75     0.13    3.81          2.14   \n",
       "1661       电信运营商   1.81     0.50    3.59          4.84   \n",
       "1681          运输   4.29     0.37    3.96          1.90   \n",
       "1692          运输   4.64    -0.23    8.84          1.97   \n",
       "1705          运输   0.30     0.34    2.85          5.94   \n",
       "1710          运输   3.52     0.44    3.59          2.26   \n",
       "1736        公用事业   0.76     0.37    3.67          5.37   \n",
       "1739        综合金融   0.14     0.04    2.52         14.29   \n",
       "1780       电信运营商   2.19     0.45    3.01          4.45   \n",
       "1786          银行   0.73     0.14   19.36          2.19   \n",
       "1824        贸易公司   8.25     0.04    3.46          1.50   \n",
       "1840       耐用消费品   0.79     0.14    1.81         11.10   \n",
       "1846        综合金融   0.35     0.17    2.96         10.97   \n",
       "1852        综合金融   0.43     0.27    5.24          5.00   \n",
       "1860    食品、饮料和烟草   0.43     0.14    1.00         10.69   \n",
       "1892          材料   1.43     0.36    2.63          4.52   \n",
       "1908          运输   1.06     0.33    1.66          4.61   \n",
       "1920          银行   0.66     0.21   10.92          2.43   \n",
       "1922     技术硬件和装备   2.46     0.23    2.49          6.40   \n",
       "1945          运输   3.61     0.02    7.63          1.85   \n",
       "1948          银行   0.66     0.17   13.45          3.33   \n",
       "1959       电信运营商   2.90     0.21    6.87          3.98   \n",
       "1960     技术硬件和装备   5.39    -0.16    5.04          1.27   \n",
       "1963     技术硬件和装备   6.40    -0.04    3.77          1.39   \n",
       "1970    食品、饮料和烟草   0.70     0.10    1.19          8.81   \n",
       "1973          炼油   0.44     0.47    2.07          2.30   \n",
       "1975        综合金融   0.04     0.47    1.29          0.98   \n",
       "1986        综合金融   0.90     0.20    3.24          7.05   \n",
       "1989          材料   0.99     0.17    1.86          8.61   \n",
       "\n",
       "                          Company_en    Company_cn Country_cn   Country_en  \n",
       "40                       PetroChina           中国石油       中国大陆           CN  \n",
       "52                             ICBC         中国工商银行       中国大陆           CN  \n",
       "68      CCB-China Construction Bank         中国建设银行       中国大陆           CN  \n",
       "70          Sinopec-China Petroleum            中石化       中国大陆           CN  \n",
       "81                    Bank of China           中国银行       中国大陆           CN  \n",
       "88                     China Mobile           中国移动       中国香港  HK)/中国大陆(CN  \n",
       "175                Hutchison Whampoa          和记黄埔       中国香港  HK)/中国大陆(CN  \n",
       "180                    China Telecom          中国电信       中国大陆           CN  \n",
       "242            China Life Insurance           中国人寿       中国大陆           CN  \n",
       "307           Bank of Communications        中国交通银行       中国大陆           CN  \n",
       "309             Taiwan Semiconductor           台积电       中国台湾           TA  \n",
       "340           Hon Hai Precision Ind           鸿海精密       中国台湾           TA  \n",
       "365            Baoshan Iron & Steel         上海宝钢集团       中国大陆           CN  \n",
       "388                 Cathay Financial          国泰金融       中国台湾           TA  \n",
       "394                           Cnooc            中海油       中国香港  HK)/中国大陆(CN  \n",
       "400              China Netcom Group           中国网通       中国香港  HK)/中国大陆(CN  \n",
       "422             China Shenhua Energy  中国神华能源股份有限公司       中国大陆           CN  \n",
       "429                    BOC Hong Kong          中银香港       中国香港  HK)/中国大陆(CN  \n",
       "436            Formosa Petrochemical          台塑石化       中国台湾           TA  \n",
       "439          Ping An Insurance Group          平安保险       中国大陆           CN  \n",
       "451                 Jardine Matheson        香港怡和集团       中国香港  HK)/中国大陆(CN  \n",
       "510         Sun Hung Kai Properties         新鸿基房地产       中国香港  HK)/中国大陆(CN  \n",
       "541                    China Unicom           中国联通       中国香港  HK)/中国大陆(CN  \n",
       "551                    CLP Holdings           中电控股       中国香港  HK)/中国大陆(CN  \n",
       "575                 Chunghwa Telecom          中华电信       中国台湾           TA  \n",
       "600                      China Steel        台湾中钢公司       中国台湾           TA  \n",
       "603             China Merchants Bank          招商银行       中国大陆           CN  \n",
       "617                   Nan Ya Plastic        南亚塑胶工业       中国台湾           TA  \n",
       "627                      Cheung Kong          长江集团       中国香港  HK)/中国大陆(CN  \n",
       "736                   Swire Pacific           太古集团       中国香港  HK)/中国大陆(CN  \n",
       "...                              ...           ...        ...          ...  \n",
       "1636                   Champion REIT           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1641                     Noble Group           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1661                   Taiwan Mobile           NaN       中国台湾           TA  \n",
       "1681                Evergreen Marine           NaN       中国台湾           TA  \n",
       "1692         China Southern Airlines           NaN       中国大陆           CN  \n",
       "1705                   Cosco Pacific           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1710        China Shipping Container           NaN       中国大陆           CN  \n",
       "1736  China Resources Power Holdings           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1739                Citic Securities           NaN       中国大陆           CN  \n",
       "1780             Far EasTone Telecom           NaN       中国台湾           TA  \n",
       "1786                 E.Sun Financial           NaN       中国台湾           TA  \n",
       "1824           Minmetals Development           NaN       中国大陆           CN  \n",
       "1840             Shanghai Automotive           NaN       中国大陆           CN  \n",
       "1846         HK Exchanges & Clearing           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1852                       Link REIT           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1860                 Kweichow Moutai           NaN       中国大陆           CN  \n",
       "1892             Yanzhou Coal Mining           NaN       中国大陆           CN  \n",
       "1908          China Shipping Develop           NaN       中国大陆           CN  \n",
       "1920                  Wing Lung Bank           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1922               Delta Electronics           NaN       中国台湾           TA  \n",
       "1945                  China Airlines           NaN       中国台湾           TA  \n",
       "1948                  Wing Hang Bank           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1959                            PCCW           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1960                            Benq           NaN       中国台湾           TA  \n",
       "1963                        TCL Corp           NaN       中国大陆           CN  \n",
       "1970                 Wuliangye Yibin           NaN       中国大陆           CN  \n",
       "1973                CNPC (Hong Kong)           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1975             K Wah International           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1986       China Overseas Land & Inv           NaN       中国香港  HK)/中国大陆(CN  \n",
       "1989     Nine Dragons Paper Holdings           NaN       中国香港  HK)/中国大陆(CN  \n",
       "\n",
       "[131 rows x 13 columns]"
      ]
     },
     "execution_count": 220,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_2007[df_2007['Country_cn'].str.contains('中国',regex=True)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 221,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "      <th>Company_en</th>\n",
       "      <th>Company_cn</th>\n",
       "      <th>Country_cn</th>\n",
       "      <th>Country_en</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>2007</td>\n",
       "      <td>41</td>\n",
       "      <td>PetroChina /中国石油</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>68.43</td>\n",
       "      <td>16.53</td>\n",
       "      <td>96.42</td>\n",
       "      <td>208.76</td>\n",
       "      <td>PetroChina</td>\n",
       "      <td>中国石油</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>52</th>\n",
       "      <td>2007</td>\n",
       "      <td>53</td>\n",
       "      <td>ICBC /中国工商银行</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>31.98</td>\n",
       "      <td>4.65</td>\n",
       "      <td>800.04</td>\n",
       "      <td>176.03</td>\n",
       "      <td>ICBC</td>\n",
       "      <td>中国工商银行</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>68</th>\n",
       "      <td>2007</td>\n",
       "      <td>69</td>\n",
       "      <td>CCB-China Construction Bank /中国建设银行</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>23.18</td>\n",
       "      <td>5.84</td>\n",
       "      <td>568.21</td>\n",
       "      <td>126.55</td>\n",
       "      <td>CCB-China Construction Bank</td>\n",
       "      <td>中国建设银行</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70</th>\n",
       "      <td>2007</td>\n",
       "      <td>71</td>\n",
       "      <td>Sinopec-China Petroleum /中石化</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>99.03</td>\n",
       "      <td>5.07</td>\n",
       "      <td>65.83</td>\n",
       "      <td>93.57</td>\n",
       "      <td>Sinopec-China Petroleum</td>\n",
       "      <td>中石化</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>81</th>\n",
       "      <td>2007</td>\n",
       "      <td>82</td>\n",
       "      <td>Bank of China /中国银行</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>23.10</td>\n",
       "      <td>3.41</td>\n",
       "      <td>585.55</td>\n",
       "      <td>143.80</td>\n",
       "      <td>Bank of China</td>\n",
       "      <td>中国银行</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>88</th>\n",
       "      <td>2007</td>\n",
       "      <td>89</td>\n",
       "      <td>China Mobile /中国移动</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>29.79</td>\n",
       "      <td>6.56</td>\n",
       "      <td>51.35</td>\n",
       "      <td>185.31</td>\n",
       "      <td>China Mobile</td>\n",
       "      <td>中国移动</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>175</th>\n",
       "      <td>2007</td>\n",
       "      <td>176</td>\n",
       "      <td>Hutchison Whampoa/和记黄埔</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>多元化</td>\n",
       "      <td>23.55</td>\n",
       "      <td>1.85</td>\n",
       "      <td>74.97</td>\n",
       "      <td>40.57</td>\n",
       "      <td>Hutchison Whampoa</td>\n",
       "      <td>和记黄埔</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>180</th>\n",
       "      <td>2007</td>\n",
       "      <td>181</td>\n",
       "      <td>China Telecom/中国电信</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>20.98</td>\n",
       "      <td>3.46</td>\n",
       "      <td>50.34</td>\n",
       "      <td>37.50</td>\n",
       "      <td>China Telecom</td>\n",
       "      <td>中国电信</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>242</th>\n",
       "      <td>2007</td>\n",
       "      <td>243</td>\n",
       "      <td>China Life Insurance /中国人寿</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>保险</td>\n",
       "      <td>11.18</td>\n",
       "      <td>1.15</td>\n",
       "      <td>69.30</td>\n",
       "      <td>109.96</td>\n",
       "      <td>China Life Insurance</td>\n",
       "      <td>中国人寿</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>307</th>\n",
       "      <td>2007</td>\n",
       "      <td>308</td>\n",
       "      <td>Bank of Communications/中国交通银行</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>6.64</td>\n",
       "      <td>1.15</td>\n",
       "      <td>176.27</td>\n",
       "      <td>46.14</td>\n",
       "      <td>Bank of Communications</td>\n",
       "      <td>中国交通银行</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>309</th>\n",
       "      <td>2007</td>\n",
       "      <td>310</td>\n",
       "      <td>Taiwan Semiconductor/台积电</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>半导体</td>\n",
       "      <td>9.74</td>\n",
       "      <td>3.90</td>\n",
       "      <td>18.02</td>\n",
       "      <td>54.32</td>\n",
       "      <td>Taiwan Semiconductor</td>\n",
       "      <td>台积电</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>340</th>\n",
       "      <td>2007</td>\n",
       "      <td>341</td>\n",
       "      <td>Hon Hai Precision Ind /鸿海精密</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>技术硬件和装备</td>\n",
       "      <td>27.78</td>\n",
       "      <td>1.24</td>\n",
       "      <td>13.99</td>\n",
       "      <td>34.83</td>\n",
       "      <td>Hon Hai Precision Ind</td>\n",
       "      <td>鸿海精密</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>365</th>\n",
       "      <td>2007</td>\n",
       "      <td>366</td>\n",
       "      <td>Baoshan Iron &amp; Steel /上海宝钢集团</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>材料</td>\n",
       "      <td>15.63</td>\n",
       "      <td>1.57</td>\n",
       "      <td>17.59</td>\n",
       "      <td>21.42</td>\n",
       "      <td>Baoshan Iron &amp; Steel</td>\n",
       "      <td>上海宝钢集团</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>388</th>\n",
       "      <td>2007</td>\n",
       "      <td>389</td>\n",
       "      <td>Cathay Financial/国泰金融</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>保险</td>\n",
       "      <td>10.09</td>\n",
       "      <td>0.66</td>\n",
       "      <td>93.29</td>\n",
       "      <td>19.87</td>\n",
       "      <td>Cathay Financial</td>\n",
       "      <td>国泰金融</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>394</th>\n",
       "      <td>2007</td>\n",
       "      <td>395</td>\n",
       "      <td>Cnooc /中海油</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>8.51</td>\n",
       "      <td>3.10</td>\n",
       "      <td>14.22</td>\n",
       "      <td>34.94</td>\n",
       "      <td>Cnooc</td>\n",
       "      <td>中海油</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>400</th>\n",
       "      <td>2007</td>\n",
       "      <td>401</td>\n",
       "      <td>China Netcom Group /中国网通</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>10.69</td>\n",
       "      <td>1.70</td>\n",
       "      <td>24.70</td>\n",
       "      <td>15.70</td>\n",
       "      <td>China Netcom Group</td>\n",
       "      <td>中国网通</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>422</th>\n",
       "      <td>2007</td>\n",
       "      <td>423</td>\n",
       "      <td>China Shenhua Energy/中国神华能源股份有限公司</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>材料</td>\n",
       "      <td>6.47</td>\n",
       "      <td>1.94</td>\n",
       "      <td>17.08</td>\n",
       "      <td>45.94</td>\n",
       "      <td>China Shenhua Energy</td>\n",
       "      <td>中国神华能源股份有限公司</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>429</th>\n",
       "      <td>2007</td>\n",
       "      <td>430</td>\n",
       "      <td>BOC Hong Kong/中银香港</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>4.13</td>\n",
       "      <td>1.74</td>\n",
       "      <td>106.03</td>\n",
       "      <td>25.58</td>\n",
       "      <td>BOC Hong Kong</td>\n",
       "      <td>中银香港</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>436</th>\n",
       "      <td>2007</td>\n",
       "      <td>437</td>\n",
       "      <td>Formosa Petrochemical/台塑石化</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>13.56</td>\n",
       "      <td>1.74</td>\n",
       "      <td>12.35</td>\n",
       "      <td>19.28</td>\n",
       "      <td>Formosa Petrochemical</td>\n",
       "      <td>台塑石化</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>439</th>\n",
       "      <td>2007</td>\n",
       "      <td>440</td>\n",
       "      <td>Ping An Insurance Group/平安保险</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>保险</td>\n",
       "      <td>7.95</td>\n",
       "      <td>0.52</td>\n",
       "      <td>39.62</td>\n",
       "      <td>39.60</td>\n",
       "      <td>Ping An Insurance Group</td>\n",
       "      <td>平安保险</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>451</th>\n",
       "      <td>2007</td>\n",
       "      <td>452</td>\n",
       "      <td>Jardine Matheson/香港怡和集团</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>食品市场</td>\n",
       "      <td>11.96</td>\n",
       "      <td>1.25</td>\n",
       "      <td>18.34</td>\n",
       "      <td>13.59</td>\n",
       "      <td>Jardine Matheson</td>\n",
       "      <td>香港怡和集团</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>510</th>\n",
       "      <td>2007</td>\n",
       "      <td>511</td>\n",
       "      <td>Sun Hung Kai Properties /新鸿基房地产</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>3.30</td>\n",
       "      <td>2.56</td>\n",
       "      <td>29.72</td>\n",
       "      <td>29.49</td>\n",
       "      <td>Sun Hung Kai Properties</td>\n",
       "      <td>新鸿基房地产</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>541</th>\n",
       "      <td>2007</td>\n",
       "      <td>542</td>\n",
       "      <td>China Unicom /中国联通</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>10.67</td>\n",
       "      <td>0.60</td>\n",
       "      <td>17.63</td>\n",
       "      <td>16.03</td>\n",
       "      <td>China Unicom</td>\n",
       "      <td>中国联通</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>551</th>\n",
       "      <td>2007</td>\n",
       "      <td>552</td>\n",
       "      <td>CLP Holdings /中电控股</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>公用事业</td>\n",
       "      <td>5.87</td>\n",
       "      <td>1.27</td>\n",
       "      <td>16.42</td>\n",
       "      <td>17.65</td>\n",
       "      <td>CLP Holdings</td>\n",
       "      <td>中电控股</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>575</th>\n",
       "      <td>2007</td>\n",
       "      <td>576</td>\n",
       "      <td>Chunghwa Telecom/中华电信</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>5.59</td>\n",
       "      <td>1.45</td>\n",
       "      <td>13.98</td>\n",
       "      <td>18.22</td>\n",
       "      <td>Chunghwa Telecom</td>\n",
       "      <td>中华电信</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>600</th>\n",
       "      <td>2007</td>\n",
       "      <td>601</td>\n",
       "      <td>China Steel/台湾中钢公司</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>材料</td>\n",
       "      <td>8.66</td>\n",
       "      <td>1.54</td>\n",
       "      <td>10.35</td>\n",
       "      <td>12.24</td>\n",
       "      <td>China Steel</td>\n",
       "      <td>台湾中钢公司</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>603</th>\n",
       "      <td>2007</td>\n",
       "      <td>604</td>\n",
       "      <td>China Merchants Bank/招商银行</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>3.53</td>\n",
       "      <td>0.46</td>\n",
       "      <td>90.76</td>\n",
       "      <td>33.19</td>\n",
       "      <td>China Merchants Bank</td>\n",
       "      <td>招商银行</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>617</th>\n",
       "      <td>2007</td>\n",
       "      <td>617</td>\n",
       "      <td>Nan Ya Plastic/南亚塑胶工业</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>化学制品</td>\n",
       "      <td>7.64</td>\n",
       "      <td>1.22</td>\n",
       "      <td>11.47</td>\n",
       "      <td>13.37</td>\n",
       "      <td>Nan Ya Plastic</td>\n",
       "      <td>南亚塑胶工业</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>627</th>\n",
       "      <td>2007</td>\n",
       "      <td>628</td>\n",
       "      <td>Cheung Kong/长江集团</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.80</td>\n",
       "      <td>1.80</td>\n",
       "      <td>28.01</td>\n",
       "      <td>28.39</td>\n",
       "      <td>Cheung Kong</td>\n",
       "      <td>长江集团</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>736</th>\n",
       "      <td>2007</td>\n",
       "      <td>737</td>\n",
       "      <td>Swire Pacific /太古集团</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>多元化</td>\n",
       "      <td>2.44</td>\n",
       "      <td>2.42</td>\n",
       "      <td>16.05</td>\n",
       "      <td>17.32</td>\n",
       "      <td>Swire Pacific</td>\n",
       "      <td>太古集团</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1636</th>\n",
       "      <td>2007</td>\n",
       "      <td>1637</td>\n",
       "      <td>Champion REIT</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.05</td>\n",
       "      <td>1.16</td>\n",
       "      <td>2.95</td>\n",
       "      <td>1.54</td>\n",
       "      <td>Champion REIT</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1641</th>\n",
       "      <td>2007</td>\n",
       "      <td>1642</td>\n",
       "      <td>Noble Group</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>运输</td>\n",
       "      <td>13.75</td>\n",
       "      <td>0.13</td>\n",
       "      <td>3.81</td>\n",
       "      <td>2.14</td>\n",
       "      <td>Noble Group</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1661</th>\n",
       "      <td>2007</td>\n",
       "      <td>1662</td>\n",
       "      <td>Taiwan Mobile</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>1.81</td>\n",
       "      <td>0.50</td>\n",
       "      <td>3.59</td>\n",
       "      <td>4.84</td>\n",
       "      <td>Taiwan Mobile</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1681</th>\n",
       "      <td>2007</td>\n",
       "      <td>1682</td>\n",
       "      <td>Evergreen Marine</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>运输</td>\n",
       "      <td>4.29</td>\n",
       "      <td>0.37</td>\n",
       "      <td>3.96</td>\n",
       "      <td>1.90</td>\n",
       "      <td>Evergreen Marine</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1692</th>\n",
       "      <td>2007</td>\n",
       "      <td>1693</td>\n",
       "      <td>China Southern Airlines</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>运输</td>\n",
       "      <td>4.64</td>\n",
       "      <td>-0.23</td>\n",
       "      <td>8.84</td>\n",
       "      <td>1.97</td>\n",
       "      <td>China Southern Airlines</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1705</th>\n",
       "      <td>2007</td>\n",
       "      <td>1706</td>\n",
       "      <td>Cosco Pacific</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>运输</td>\n",
       "      <td>0.30</td>\n",
       "      <td>0.34</td>\n",
       "      <td>2.85</td>\n",
       "      <td>5.94</td>\n",
       "      <td>Cosco Pacific</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1710</th>\n",
       "      <td>2007</td>\n",
       "      <td>1711</td>\n",
       "      <td>China Shipping Container</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>运输</td>\n",
       "      <td>3.52</td>\n",
       "      <td>0.44</td>\n",
       "      <td>3.59</td>\n",
       "      <td>2.26</td>\n",
       "      <td>China Shipping Container</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1736</th>\n",
       "      <td>2007</td>\n",
       "      <td>1737</td>\n",
       "      <td>China Resources Power Holdings</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>公用事业</td>\n",
       "      <td>0.76</td>\n",
       "      <td>0.37</td>\n",
       "      <td>3.67</td>\n",
       "      <td>5.37</td>\n",
       "      <td>China Resources Power Holdings</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1739</th>\n",
       "      <td>2007</td>\n",
       "      <td>1740</td>\n",
       "      <td>Citic Securities</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.14</td>\n",
       "      <td>0.04</td>\n",
       "      <td>2.52</td>\n",
       "      <td>14.29</td>\n",
       "      <td>Citic Securities</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1780</th>\n",
       "      <td>2007</td>\n",
       "      <td>1781</td>\n",
       "      <td>Far EasTone Telecom</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>2.19</td>\n",
       "      <td>0.45</td>\n",
       "      <td>3.01</td>\n",
       "      <td>4.45</td>\n",
       "      <td>Far EasTone Telecom</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1786</th>\n",
       "      <td>2007</td>\n",
       "      <td>1787</td>\n",
       "      <td>E.Sun Financial</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>银行</td>\n",
       "      <td>0.73</td>\n",
       "      <td>0.14</td>\n",
       "      <td>19.36</td>\n",
       "      <td>2.19</td>\n",
       "      <td>E.Sun Financial</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1824</th>\n",
       "      <td>2007</td>\n",
       "      <td>1825</td>\n",
       "      <td>Minmetals Development</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>贸易公司</td>\n",
       "      <td>8.25</td>\n",
       "      <td>0.04</td>\n",
       "      <td>3.46</td>\n",
       "      <td>1.50</td>\n",
       "      <td>Minmetals Development</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1840</th>\n",
       "      <td>2007</td>\n",
       "      <td>1841</td>\n",
       "      <td>Shanghai Automotive</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>耐用消费品</td>\n",
       "      <td>0.79</td>\n",
       "      <td>0.14</td>\n",
       "      <td>1.81</td>\n",
       "      <td>11.10</td>\n",
       "      <td>Shanghai Automotive</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1846</th>\n",
       "      <td>2007</td>\n",
       "      <td>1847</td>\n",
       "      <td>HK Exchanges &amp; Clearing</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.35</td>\n",
       "      <td>0.17</td>\n",
       "      <td>2.96</td>\n",
       "      <td>10.97</td>\n",
       "      <td>HK Exchanges &amp; Clearing</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1852</th>\n",
       "      <td>2007</td>\n",
       "      <td>1853</td>\n",
       "      <td>Link REIT</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.43</td>\n",
       "      <td>0.27</td>\n",
       "      <td>5.24</td>\n",
       "      <td>5.00</td>\n",
       "      <td>Link REIT</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1860</th>\n",
       "      <td>2007</td>\n",
       "      <td>1861</td>\n",
       "      <td>Kweichow Moutai</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>食品、饮料和烟草</td>\n",
       "      <td>0.43</td>\n",
       "      <td>0.14</td>\n",
       "      <td>1.00</td>\n",
       "      <td>10.69</td>\n",
       "      <td>Kweichow Moutai</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1892</th>\n",
       "      <td>2007</td>\n",
       "      <td>1892</td>\n",
       "      <td>Yanzhou Coal Mining</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>材料</td>\n",
       "      <td>1.43</td>\n",
       "      <td>0.36</td>\n",
       "      <td>2.63</td>\n",
       "      <td>4.52</td>\n",
       "      <td>Yanzhou Coal Mining</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1908</th>\n",
       "      <td>2007</td>\n",
       "      <td>1909</td>\n",
       "      <td>China Shipping Develop</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>运输</td>\n",
       "      <td>1.06</td>\n",
       "      <td>0.33</td>\n",
       "      <td>1.66</td>\n",
       "      <td>4.61</td>\n",
       "      <td>China Shipping Develop</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1920</th>\n",
       "      <td>2007</td>\n",
       "      <td>1920</td>\n",
       "      <td>Wing Lung Bank</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>0.66</td>\n",
       "      <td>0.21</td>\n",
       "      <td>10.92</td>\n",
       "      <td>2.43</td>\n",
       "      <td>Wing Lung Bank</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1922</th>\n",
       "      <td>2007</td>\n",
       "      <td>1923</td>\n",
       "      <td>Delta Electronics</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>技术硬件和装备</td>\n",
       "      <td>2.46</td>\n",
       "      <td>0.23</td>\n",
       "      <td>2.49</td>\n",
       "      <td>6.40</td>\n",
       "      <td>Delta Electronics</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1945</th>\n",
       "      <td>2007</td>\n",
       "      <td>1946</td>\n",
       "      <td>China Airlines</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>运输</td>\n",
       "      <td>3.61</td>\n",
       "      <td>0.02</td>\n",
       "      <td>7.63</td>\n",
       "      <td>1.85</td>\n",
       "      <td>China Airlines</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1948</th>\n",
       "      <td>2007</td>\n",
       "      <td>1949</td>\n",
       "      <td>Wing Hang Bank</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>银行</td>\n",
       "      <td>0.66</td>\n",
       "      <td>0.17</td>\n",
       "      <td>13.45</td>\n",
       "      <td>3.33</td>\n",
       "      <td>Wing Hang Bank</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1959</th>\n",
       "      <td>2007</td>\n",
       "      <td>1959</td>\n",
       "      <td>PCCW</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>电信运营商</td>\n",
       "      <td>2.90</td>\n",
       "      <td>0.21</td>\n",
       "      <td>6.87</td>\n",
       "      <td>3.98</td>\n",
       "      <td>PCCW</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1960</th>\n",
       "      <td>2007</td>\n",
       "      <td>1961</td>\n",
       "      <td>Benq</td>\n",
       "      <td>中国台湾(TA)</td>\n",
       "      <td>技术硬件和装备</td>\n",
       "      <td>5.39</td>\n",
       "      <td>-0.16</td>\n",
       "      <td>5.04</td>\n",
       "      <td>1.27</td>\n",
       "      <td>Benq</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国台湾</td>\n",
       "      <td>CN-TA</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1963</th>\n",
       "      <td>2007</td>\n",
       "      <td>1964</td>\n",
       "      <td>TCL Corp</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>技术硬件和装备</td>\n",
       "      <td>6.40</td>\n",
       "      <td>-0.04</td>\n",
       "      <td>3.77</td>\n",
       "      <td>1.39</td>\n",
       "      <td>TCL Corp</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1970</th>\n",
       "      <td>2007</td>\n",
       "      <td>1971</td>\n",
       "      <td>Wuliangye Yibin</td>\n",
       "      <td>中国大陆(CN)</td>\n",
       "      <td>食品、饮料和烟草</td>\n",
       "      <td>0.70</td>\n",
       "      <td>0.10</td>\n",
       "      <td>1.19</td>\n",
       "      <td>8.81</td>\n",
       "      <td>Wuliangye Yibin</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>CN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1973</th>\n",
       "      <td>2007</td>\n",
       "      <td>1974</td>\n",
       "      <td>CNPC (Hong Kong)</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>0.44</td>\n",
       "      <td>0.47</td>\n",
       "      <td>2.07</td>\n",
       "      <td>2.30</td>\n",
       "      <td>CNPC (Hong Kong)</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1975</th>\n",
       "      <td>2007</td>\n",
       "      <td>1976</td>\n",
       "      <td>K Wah International</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.04</td>\n",
       "      <td>0.47</td>\n",
       "      <td>1.29</td>\n",
       "      <td>0.98</td>\n",
       "      <td>K Wah International</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1986</th>\n",
       "      <td>2007</td>\n",
       "      <td>1987</td>\n",
       "      <td>China Overseas Land &amp; Inv</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.90</td>\n",
       "      <td>0.20</td>\n",
       "      <td>3.24</td>\n",
       "      <td>7.05</td>\n",
       "      <td>China Overseas Land &amp; Inv</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1989</th>\n",
       "      <td>2007</td>\n",
       "      <td>1989</td>\n",
       "      <td>Nine Dragons Paper Holdings</td>\n",
       "      <td>中国香港(HK)/中国大陆(CN)</td>\n",
       "      <td>材料</td>\n",
       "      <td>0.99</td>\n",
       "      <td>0.17</td>\n",
       "      <td>1.86</td>\n",
       "      <td>8.61</td>\n",
       "      <td>Nine Dragons Paper Holdings</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>CN-HK</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>131 rows × 13 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      Year  Rank                        Company_cn_en      Country_cn_en  \\\n",
       "40    2007    41                     PetroChina /中国石油           中国大陆(CN)   \n",
       "52    2007    53                         ICBC /中国工商银行           中国大陆(CN)   \n",
       "68    2007    69  CCB-China Construction Bank /中国建设银行           中国大陆(CN)   \n",
       "70    2007    71         Sinopec-China Petroleum /中石化           中国大陆(CN)   \n",
       "81    2007    82                  Bank of China /中国银行           中国大陆(CN)   \n",
       "88    2007    89                   China Mobile /中国移动  中国香港(HK)/中国大陆(CN)   \n",
       "175   2007   176               Hutchison Whampoa/和记黄埔  中国香港(HK)/中国大陆(CN)   \n",
       "180   2007   181                   China Telecom/中国电信           中国大陆(CN)   \n",
       "242   2007   243           China Life Insurance /中国人寿           中国大陆(CN)   \n",
       "307   2007   308        Bank of Communications/中国交通银行           中国大陆(CN)   \n",
       "309   2007   310             Taiwan Semiconductor/台积电           中国台湾(TA)   \n",
       "340   2007   341          Hon Hai Precision Ind /鸿海精密           中国台湾(TA)   \n",
       "365   2007   366         Baoshan Iron & Steel /上海宝钢集团           中国大陆(CN)   \n",
       "388   2007   389                Cathay Financial/国泰金融           中国台湾(TA)   \n",
       "394   2007   395                           Cnooc /中海油  中国香港(HK)/中国大陆(CN)   \n",
       "400   2007   401             China Netcom Group /中国网通  中国香港(HK)/中国大陆(CN)   \n",
       "422   2007   423    China Shenhua Energy/中国神华能源股份有限公司           中国大陆(CN)   \n",
       "429   2007   430                   BOC Hong Kong/中银香港  中国香港(HK)/中国大陆(CN)   \n",
       "436   2007   437           Formosa Petrochemical/台塑石化           中国台湾(TA)   \n",
       "439   2007   440         Ping An Insurance Group/平安保险           中国大陆(CN)   \n",
       "451   2007   452              Jardine Matheson/香港怡和集团  中国香港(HK)/中国大陆(CN)   \n",
       "510   2007   511      Sun Hung Kai Properties /新鸿基房地产  中国香港(HK)/中国大陆(CN)   \n",
       "541   2007   542                   China Unicom /中国联通  中国香港(HK)/中国大陆(CN)   \n",
       "551   2007   552                   CLP Holdings /中电控股  中国香港(HK)/中国大陆(CN)   \n",
       "575   2007   576                Chunghwa Telecom/中华电信           中国台湾(TA)   \n",
       "600   2007   601                   China Steel/台湾中钢公司           中国台湾(TA)   \n",
       "603   2007   604            China Merchants Bank/招商银行           中国大陆(CN)   \n",
       "617   2007   617                Nan Ya Plastic/南亚塑胶工业           中国台湾(TA)   \n",
       "627   2007   628                     Cheung Kong/长江集团  中国香港(HK)/中国大陆(CN)   \n",
       "736   2007   737                  Swire Pacific /太古集团  中国香港(HK)/中国大陆(CN)   \n",
       "...    ...   ...                                  ...                ...   \n",
       "1636  2007  1637                        Champion REIT  中国香港(HK)/中国大陆(CN)   \n",
       "1641  2007  1642                          Noble Group  中国香港(HK)/中国大陆(CN)   \n",
       "1661  2007  1662                        Taiwan Mobile           中国台湾(TA)   \n",
       "1681  2007  1682                     Evergreen Marine           中国台湾(TA)   \n",
       "1692  2007  1693              China Southern Airlines           中国大陆(CN)   \n",
       "1705  2007  1706                        Cosco Pacific  中国香港(HK)/中国大陆(CN)   \n",
       "1710  2007  1711             China Shipping Container           中国大陆(CN)   \n",
       "1736  2007  1737       China Resources Power Holdings  中国香港(HK)/中国大陆(CN)   \n",
       "1739  2007  1740                     Citic Securities           中国大陆(CN)   \n",
       "1780  2007  1781                  Far EasTone Telecom           中国台湾(TA)   \n",
       "1786  2007  1787                      E.Sun Financial           中国台湾(TA)   \n",
       "1824  2007  1825                Minmetals Development           中国大陆(CN)   \n",
       "1840  2007  1841                  Shanghai Automotive           中国大陆(CN)   \n",
       "1846  2007  1847              HK Exchanges & Clearing  中国香港(HK)/中国大陆(CN)   \n",
       "1852  2007  1853                            Link REIT  中国香港(HK)/中国大陆(CN)   \n",
       "1860  2007  1861                      Kweichow Moutai           中国大陆(CN)   \n",
       "1892  2007  1892                  Yanzhou Coal Mining           中国大陆(CN)   \n",
       "1908  2007  1909               China Shipping Develop           中国大陆(CN)   \n",
       "1920  2007  1920                       Wing Lung Bank  中国香港(HK)/中国大陆(CN)   \n",
       "1922  2007  1923                    Delta Electronics           中国台湾(TA)   \n",
       "1945  2007  1946                       China Airlines           中国台湾(TA)   \n",
       "1948  2007  1949                       Wing Hang Bank  中国香港(HK)/中国大陆(CN)   \n",
       "1959  2007  1959                                 PCCW  中国香港(HK)/中国大陆(CN)   \n",
       "1960  2007  1961                                 Benq           中国台湾(TA)   \n",
       "1963  2007  1964                             TCL Corp           中国大陆(CN)   \n",
       "1970  2007  1971                      Wuliangye Yibin           中国大陆(CN)   \n",
       "1973  2007  1974                     CNPC (Hong Kong)  中国香港(HK)/中国大陆(CN)   \n",
       "1975  2007  1976                  K Wah International  中国香港(HK)/中国大陆(CN)   \n",
       "1986  2007  1987            China Overseas Land & Inv  中国香港(HK)/中国大陆(CN)   \n",
       "1989  2007  1989          Nine Dragons Paper Holdings  中国香港(HK)/中国大陆(CN)   \n",
       "\n",
       "     Industry_cn  Sales  Profits  Assets  Market_value  \\\n",
       "40            炼油  68.43    16.53   96.42        208.76   \n",
       "52            银行  31.98     4.65  800.04        176.03   \n",
       "68            银行  23.18     5.84  568.21        126.55   \n",
       "70            炼油  99.03     5.07   65.83         93.57   \n",
       "81            银行  23.10     3.41  585.55        143.80   \n",
       "88         电信运营商  29.79     6.56   51.35        185.31   \n",
       "175          多元化  23.55     1.85   74.97         40.57   \n",
       "180        电信运营商  20.98     3.46   50.34         37.50   \n",
       "242           保险  11.18     1.15   69.30        109.96   \n",
       "307           银行   6.64     1.15  176.27         46.14   \n",
       "309          半导体   9.74     3.90   18.02         54.32   \n",
       "340      技术硬件和装备  27.78     1.24   13.99         34.83   \n",
       "365           材料  15.63     1.57   17.59         21.42   \n",
       "388           保险  10.09     0.66   93.29         19.87   \n",
       "394           炼油   8.51     3.10   14.22         34.94   \n",
       "400        电信运营商  10.69     1.70   24.70         15.70   \n",
       "422           材料   6.47     1.94   17.08         45.94   \n",
       "429           银行   4.13     1.74  106.03         25.58   \n",
       "436           炼油  13.56     1.74   12.35         19.28   \n",
       "439           保险   7.95     0.52   39.62         39.60   \n",
       "451         食品市场  11.96     1.25   18.34         13.59   \n",
       "510         综合金融   3.30     2.56   29.72         29.49   \n",
       "541        电信运营商  10.67     0.60   17.63         16.03   \n",
       "551         公用事业   5.87     1.27   16.42         17.65   \n",
       "575        电信运营商   5.59     1.45   13.98         18.22   \n",
       "600           材料   8.66     1.54   10.35         12.24   \n",
       "603           银行   3.53     0.46   90.76         33.19   \n",
       "617         化学制品   7.64     1.22   11.47         13.37   \n",
       "627         综合金融   0.80     1.80   28.01         28.39   \n",
       "736          多元化   2.44     2.42   16.05         17.32   \n",
       "...          ...    ...      ...     ...           ...   \n",
       "1636        综合金融   0.05     1.16    2.95          1.54   \n",
       "1641          运输  13.75     0.13    3.81          2.14   \n",
       "1661       电信运营商   1.81     0.50    3.59          4.84   \n",
       "1681          运输   4.29     0.37    3.96          1.90   \n",
       "1692          运输   4.64    -0.23    8.84          1.97   \n",
       "1705          运输   0.30     0.34    2.85          5.94   \n",
       "1710          运输   3.52     0.44    3.59          2.26   \n",
       "1736        公用事业   0.76     0.37    3.67          5.37   \n",
       "1739        综合金融   0.14     0.04    2.52         14.29   \n",
       "1780       电信运营商   2.19     0.45    3.01          4.45   \n",
       "1786          银行   0.73     0.14   19.36          2.19   \n",
       "1824        贸易公司   8.25     0.04    3.46          1.50   \n",
       "1840       耐用消费品   0.79     0.14    1.81         11.10   \n",
       "1846        综合金融   0.35     0.17    2.96         10.97   \n",
       "1852        综合金融   0.43     0.27    5.24          5.00   \n",
       "1860    食品、饮料和烟草   0.43     0.14    1.00         10.69   \n",
       "1892          材料   1.43     0.36    2.63          4.52   \n",
       "1908          运输   1.06     0.33    1.66          4.61   \n",
       "1920          银行   0.66     0.21   10.92          2.43   \n",
       "1922     技术硬件和装备   2.46     0.23    2.49          6.40   \n",
       "1945          运输   3.61     0.02    7.63          1.85   \n",
       "1948          银行   0.66     0.17   13.45          3.33   \n",
       "1959       电信运营商   2.90     0.21    6.87          3.98   \n",
       "1960     技术硬件和装备   5.39    -0.16    5.04          1.27   \n",
       "1963     技术硬件和装备   6.40    -0.04    3.77          1.39   \n",
       "1970    食品、饮料和烟草   0.70     0.10    1.19          8.81   \n",
       "1973          炼油   0.44     0.47    2.07          2.30   \n",
       "1975        综合金融   0.04     0.47    1.29          0.98   \n",
       "1986        综合金融   0.90     0.20    3.24          7.05   \n",
       "1989          材料   0.99     0.17    1.86          8.61   \n",
       "\n",
       "                          Company_en    Company_cn Country_cn Country_en  \n",
       "40                       PetroChina           中国石油       中国大陆         CN  \n",
       "52                             ICBC         中国工商银行       中国大陆         CN  \n",
       "68      CCB-China Construction Bank         中国建设银行       中国大陆         CN  \n",
       "70          Sinopec-China Petroleum            中石化       中国大陆         CN  \n",
       "81                    Bank of China           中国银行       中国大陆         CN  \n",
       "88                     China Mobile           中国移动       中国香港      CN-HK  \n",
       "175                Hutchison Whampoa          和记黄埔       中国香港      CN-HK  \n",
       "180                    China Telecom          中国电信       中国大陆         CN  \n",
       "242            China Life Insurance           中国人寿       中国大陆         CN  \n",
       "307           Bank of Communications        中国交通银行       中国大陆         CN  \n",
       "309             Taiwan Semiconductor           台积电       中国台湾      CN-TA  \n",
       "340           Hon Hai Precision Ind           鸿海精密       中国台湾      CN-TA  \n",
       "365            Baoshan Iron & Steel         上海宝钢集团       中国大陆         CN  \n",
       "388                 Cathay Financial          国泰金融       中国台湾      CN-TA  \n",
       "394                           Cnooc            中海油       中国香港      CN-HK  \n",
       "400              China Netcom Group           中国网通       中国香港      CN-HK  \n",
       "422             China Shenhua Energy  中国神华能源股份有限公司       中国大陆         CN  \n",
       "429                    BOC Hong Kong          中银香港       中国香港      CN-HK  \n",
       "436            Formosa Petrochemical          台塑石化       中国台湾      CN-TA  \n",
       "439          Ping An Insurance Group          平安保险       中国大陆         CN  \n",
       "451                 Jardine Matheson        香港怡和集团       中国香港      CN-HK  \n",
       "510         Sun Hung Kai Properties         新鸿基房地产       中国香港      CN-HK  \n",
       "541                    China Unicom           中国联通       中国香港      CN-HK  \n",
       "551                    CLP Holdings           中电控股       中国香港      CN-HK  \n",
       "575                 Chunghwa Telecom          中华电信       中国台湾      CN-TA  \n",
       "600                      China Steel        台湾中钢公司       中国台湾      CN-TA  \n",
       "603             China Merchants Bank          招商银行       中国大陆         CN  \n",
       "617                   Nan Ya Plastic        南亚塑胶工业       中国台湾      CN-TA  \n",
       "627                      Cheung Kong          长江集团       中国香港      CN-HK  \n",
       "736                   Swire Pacific           太古集团       中国香港      CN-HK  \n",
       "...                              ...           ...        ...        ...  \n",
       "1636                   Champion REIT           NaN       中国香港      CN-HK  \n",
       "1641                     Noble Group           NaN       中国香港      CN-HK  \n",
       "1661                   Taiwan Mobile           NaN       中国台湾      CN-TA  \n",
       "1681                Evergreen Marine           NaN       中国台湾      CN-TA  \n",
       "1692         China Southern Airlines           NaN       中国大陆         CN  \n",
       "1705                   Cosco Pacific           NaN       中国香港      CN-HK  \n",
       "1710        China Shipping Container           NaN       中国大陆         CN  \n",
       "1736  China Resources Power Holdings           NaN       中国香港      CN-HK  \n",
       "1739                Citic Securities           NaN       中国大陆         CN  \n",
       "1780             Far EasTone Telecom           NaN       中国台湾      CN-TA  \n",
       "1786                 E.Sun Financial           NaN       中国台湾      CN-TA  \n",
       "1824           Minmetals Development           NaN       中国大陆         CN  \n",
       "1840             Shanghai Automotive           NaN       中国大陆         CN  \n",
       "1846         HK Exchanges & Clearing           NaN       中国香港      CN-HK  \n",
       "1852                       Link REIT           NaN       中国香港      CN-HK  \n",
       "1860                 Kweichow Moutai           NaN       中国大陆         CN  \n",
       "1892             Yanzhou Coal Mining           NaN       中国大陆         CN  \n",
       "1908          China Shipping Develop           NaN       中国大陆         CN  \n",
       "1920                  Wing Lung Bank           NaN       中国香港      CN-HK  \n",
       "1922               Delta Electronics           NaN       中国台湾      CN-TA  \n",
       "1945                  China Airlines           NaN       中国台湾      CN-TA  \n",
       "1948                  Wing Hang Bank           NaN       中国香港      CN-HK  \n",
       "1959                            PCCW           NaN       中国香港      CN-HK  \n",
       "1960                            Benq           NaN       中国台湾      CN-TA  \n",
       "1963                        TCL Corp           NaN       中国大陆         CN  \n",
       "1970                 Wuliangye Yibin           NaN       中国大陆         CN  \n",
       "1973                CNPC (Hong Kong)           NaN       中国香港      CN-HK  \n",
       "1975             K Wah International           NaN       中国香港      CN-HK  \n",
       "1986       China Overseas Land & Inv           NaN       中国香港      CN-HK  \n",
       "1989     Nine Dragons Paper Holdings           NaN       中国香港      CN-HK  \n",
       "\n",
       "[131 rows x 13 columns]"
      ]
     },
     "execution_count": 221,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Prefix the Hong Kong and Taiwan codes with 'CN-'. 'HK.*' also swallows any\n",
    "# text that follows 'HK' in the value. The negative lookbehind (?<!CN-) skips\n",
    "# values that already carry the prefix, so re-running this cell does not turn\n",
    "# 'CN-HK' into 'CN-CN-HK' (or 'CN-TA' into 'CN-CN-TA').\n",
    "df_2007['Country_en'] = df_2007['Country_en'].replace(\n",
    "    ['(?<!CN-)HK.*', '(?<!CN-)TA'], ['CN-HK', 'CN-TA'], regex=True)\n",
    "# Display every row whose country code contains 'CN' to check the result.\n",
    "df_2007[df_2007['Country_en'].str.contains('CN',regex=True)]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 考虑到其他年份，公司所在行业有用英文名称展示的，这里添加一列英文的行业名称，但内容是空白"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 222,
   "metadata": {
    "collapsed": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "      <th>Company_en</th>\n",
       "      <th>Company_cn</th>\n",
       "      <th>Country_cn</th>\n",
       "      <th>Country_en</th>\n",
       "      <th>Industry_en</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1995</th>\n",
       "      <td>2007</td>\n",
       "      <td>1995</td>\n",
       "      <td>Fremont General</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>1.25</td>\n",
       "      <td>0.17</td>\n",
       "      <td>12.80</td>\n",
       "      <td>0.69</td>\n",
       "      <td>Fremont General</td>\n",
       "      <td>NaN</td>\n",
       "      <td>美国</td>\n",
       "      <td>US</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1996</th>\n",
       "      <td>2007</td>\n",
       "      <td>1997</td>\n",
       "      <td>United Rentals</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>商业服务和供应</td>\n",
       "      <td>3.64</td>\n",
       "      <td>0.22</td>\n",
       "      <td>5.37</td>\n",
       "      <td>2.32</td>\n",
       "      <td>United Rentals</td>\n",
       "      <td>NaN</td>\n",
       "      <td>美国</td>\n",
       "      <td>US</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1997</th>\n",
       "      <td>2007</td>\n",
       "      <td>1998</td>\n",
       "      <td>CBOT Holdings</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>综合金融</td>\n",
       "      <td>0.64</td>\n",
       "      <td>0.17</td>\n",
       "      <td>0.81</td>\n",
       "      <td>8.54</td>\n",
       "      <td>CBOT Holdings</td>\n",
       "      <td>NaN</td>\n",
       "      <td>美国</td>\n",
       "      <td>US</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1998</th>\n",
       "      <td>2007</td>\n",
       "      <td>1998</td>\n",
       "      <td>Singapore Petroleum</td>\n",
       "      <td>新加坡(SI)</td>\n",
       "      <td>炼油</td>\n",
       "      <td>5.59</td>\n",
       "      <td>0.19</td>\n",
       "      <td>2.05</td>\n",
       "      <td>1.50</td>\n",
       "      <td>Singapore Petroleum</td>\n",
       "      <td>NaN</td>\n",
       "      <td>新加坡</td>\n",
       "      <td>SI</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1999</th>\n",
       "      <td>2007</td>\n",
       "      <td>2000</td>\n",
       "      <td>DVB Bank</td>\n",
       "      <td>德国(GE)</td>\n",
       "      <td>银行</td>\n",
       "      <td>0.77</td>\n",
       "      <td>0.06</td>\n",
       "      <td>12.74</td>\n",
       "      <td>1.26</td>\n",
       "      <td>DVB Bank</td>\n",
       "      <td>NaN</td>\n",
       "      <td>德国</td>\n",
       "      <td>GE</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      Year  Rank        Company_cn_en Country_cn_en Industry_cn  Sales  \\\n",
       "1995  2007  1995      Fremont General        美国(US)        综合金融   1.25   \n",
       "1996  2007  1997       United Rentals        美国(US)     商业服务和供应   3.64   \n",
       "1997  2007  1998        CBOT Holdings        美国(US)        综合金融   0.64   \n",
       "1998  2007  1998  Singapore Petroleum       新加坡(SI)          炼油   5.59   \n",
       "1999  2007  2000             DVB Bank        德国(GE)          银行   0.77   \n",
       "\n",
       "      Profits  Assets  Market_value           Company_en Company_cn  \\\n",
       "1995     0.17   12.80          0.69      Fremont General        NaN   \n",
       "1996     0.22    5.37          2.32       United Rentals        NaN   \n",
       "1997     0.17    0.81          8.54        CBOT Holdings        NaN   \n",
       "1998     0.19    2.05          1.50  Singapore Petroleum        NaN   \n",
       "1999     0.06   12.74          1.26             DVB Bank        NaN   \n",
       "\n",
       "     Country_cn Country_en Industry_en  \n",
       "1995         美国         US              \n",
       "1996         美国         US              \n",
       "1997         美国         US              \n",
       "1998        新加坡         SI              \n",
       "1999         德国         GE              "
      ]
     },
     "execution_count": 222,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Add an English industry-name column filled with empty strings.\n",
    "df_2007.loc[:, 'Industry_en'] = ''\n",
    "df_2007.tail(n=3)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* **将列名进行重新排序**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 223,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "columns_sort = ['Year', 'Rank', 'Company_cn_en','Company_en',\n",
    "                'Company_cn', 'Country_cn_en', 'Country_cn', \n",
    "                'Country_en', 'Industry_cn', 'Industry_en',\n",
    "                'Sales', 'Profits', 'Assets', 'Market_value']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 224,
   "metadata": {
    "collapsed": false,
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(2000, 14)\n",
      "Year               int64\n",
      "Rank               int64\n",
      "Company_cn_en     object\n",
      "Company_en        object\n",
      "Company_cn        object\n",
      "Country_cn_en     object\n",
      "Country_cn        object\n",
      "Country_en        object\n",
      "Industry_cn       object\n",
      "Industry_en       object\n",
      "Sales            float64\n",
      "Profits          float64\n",
      "Assets           float64\n",
      "Market_value     float64\n",
      "dtype: object\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Year</th>\n",
       "      <th>Rank</th>\n",
       "      <th>Company_cn_en</th>\n",
       "      <th>Company_en</th>\n",
       "      <th>Company_cn</th>\n",
       "      <th>Country_cn_en</th>\n",
       "      <th>Country_cn</th>\n",
       "      <th>Country_en</th>\n",
       "      <th>Industry_cn</th>\n",
       "      <th>Industry_en</th>\n",
       "      <th>Sales</th>\n",
       "      <th>Profits</th>\n",
       "      <th>Assets</th>\n",
       "      <th>Market_value</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>2007</td>\n",
       "      <td>1</td>\n",
       "      <td>Citigroup /花旗集团</td>\n",
       "      <td>Citigroup</td>\n",
       "      <td>花旗集团</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>美国</td>\n",
       "      <td>US</td>\n",
       "      <td>银行</td>\n",
       "      <td></td>\n",
       "      <td>146.56</td>\n",
       "      <td>21.54</td>\n",
       "      <td>1884.32</td>\n",
       "      <td>247.42</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2007</td>\n",
       "      <td>2</td>\n",
       "      <td>Bank of America /美国银行</td>\n",
       "      <td>Bank of America</td>\n",
       "      <td>美国银行</td>\n",
       "      <td>美国(US)</td>\n",
       "      <td>美国</td>\n",
       "      <td>US</td>\n",
       "      <td>银行</td>\n",
       "      <td></td>\n",
       "      <td>116.57</td>\n",
       "      <td>21.13</td>\n",
       "      <td>1459.74</td>\n",
       "      <td>226.61</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2007</td>\n",
       "      <td>3</td>\n",
       "      <td>HSBC Holdings/汇丰集团</td>\n",
       "      <td>HSBC Holdings</td>\n",
       "      <td>汇丰集团</td>\n",
       "      <td>英国(UK)</td>\n",
       "      <td>英国</td>\n",
       "      <td>UK</td>\n",
       "      <td>银行</td>\n",
       "      <td></td>\n",
       "      <td>121.51</td>\n",
       "      <td>16.63</td>\n",
       "      <td>1860.76</td>\n",
       "      <td>202.29</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "   Year  Rank          Company_cn_en        Company_en Company_cn  \\\n",
       "0  2007     1        Citigroup /花旗集团        Citigroup        花旗集团   \n",
       "1  2007     2  Bank of America /美国银行  Bank of America        美国银行   \n",
       "2  2007     3     HSBC Holdings/汇丰集团     HSBC Holdings       汇丰集团   \n",
       "\n",
       "  Country_cn_en Country_cn Country_en Industry_cn Industry_en   Sales  \\\n",
       "0        美国(US)         美国         US          银行              146.56   \n",
       "1        美国(US)         美国         US          银行              116.57   \n",
       "2        英国(UK)         英国         UK          银行              121.51   \n",
       "\n",
       "   Profits   Assets  Market_value  \n",
       "0    21.54  1884.32        247.42  \n",
       "1    21.13  1459.74        226.61  \n",
       "2    16.63  1860.76        202.29  "
      ]
     },
     "execution_count": 224,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Reorder the columns to follow the columns_sort list.\n",
    "# reindex() silently adds an all-NaN column for any name that is not in the\n",
    "# frame and drops any column that is not in the list, so check that both\n",
    "# sets of names agree before reordering.\n",
    "column_mismatch = set(columns_sort) ^ set(df_2007.columns)\n",
    "assert not column_mismatch, 'columns_sort and df_2007.columns differ: {}'.format(sorted(column_mismatch))\n",
    "df_2007 = df_2007.reindex(columns=columns_sort)\n",
    "print(df_2007.shape)\n",
    "print(df_2007.dtypes)\n",
    "df_2007.head(3)"
   ]
  }
 ],
 "metadata": {
  "anaconda-cloud": {},
  "kernelspec": {
   "display_name": "Python [conda root]",
   "language": "python",
   "name": "conda-root-py"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.5.2"
  },
  "toc": {
   "colors": {
    "hover_highlight": "#DAA520",
    "navigate_num": "#000000",
    "navigate_text": "#333333",
    "running_highlight": "#FF0000",
    "selected_highlight": "#FFD700",
    "sidebar_border": "#EEEEEE",
    "wrapper_background": "#FFFFFF"
   },
   "moveMenuLeft": true,
   "nav_menu": {
    "height": "12px",
    "width": "252px"
   },
   "navigate_menu": true,
   "number_sections": true,
   "sideBar": true,
   "threshold": 4,
   "toc_cell": true,
   "toc_position": {
    "height": "668px",
    "left": "0px",
    "right": "1154px",
    "top": "106px",
    "width": "212px"
   },
   "toc_section_display": "block",
   "toc_window_display": true,
   "widenNotebook": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 1
}
